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2. The nucleic acid of Claim 1 , wherein said nucleotide sequence comprises a nucleotide sequence 
selected from the group consisting of the sequence shown in Figure 1 (SEQ ID NO:3), Figure 3 (SEQ ID NO:5), 
Figure 5 (SEQ ID NO:7), Figure 7 (SEQ ID NO:9), Figure 9 (SEQ ID NO:11), Figure 11 (SEQ ID NO:16), 
Figure 13 (SEQ ID NO:21), Figure 15 (SEQ ID NO:23), Figure 17 (SEQ ID NO:28), Figure 19 (SEQ ID 
NO:30), Figure 21 (SEQ ID NO:32), Figure 23 (SEQ ID NO:40), Figure 25 (SEQ ID NO:42), Figure 27 (SEQ 
ID NO:49), Figure 29 (SEQ ID NO:51), Figure 31 (SEQ ID NO:53), Figure 33 (SEQ ID NO:55), Figure 35 
(SEQ ID NO:57), Figure 37 (SEQ ID NO:62), Figure 39 (SEQ ID NO:67), Figure 41 (SEQ ID NO:69), Figure 
43 (SEQ ID NO:71), Figure 45 (SEQ ID NO:76), Figure 47 (SEQ ID NO:78), Figure 49 (SEQ ID NO:83), 
Figure 51 (SEQ ID NO:85), Figure 53 (SEQ ID NO:87), Figure 55 (SEQ ID NO:94), Figure 57 (SEQ ID 
NO:99), Figure 59 (SEQ ID NO:101), Figure 61 (SEQ ID NO:103), Figure 63 (SEQ ID NO:110), Figure 65 
(SEQ ID NO:115), Figure 67 (SEQ ID NO:117), Figure 69 (SEQ ID NO:122), Figure 71 (SEQ ID NO:127), 
Figure 73 (SEQ ID NO:129), Figure 75 (SEQ ID NO:131), Figure 77 (SEQ ID NO:133), Figure 79 (SEQ ID 
NO: 135), Figure 81 (SEQ ID NO: 137), Figure 83 (SEQ ID NO: 139), Figure 85 (SEQ ID NO: 141), Figure 87 
(SEQ ID NO: 143), Figure 89 (SEQ ID NO: 145), Figure 91 (SEQ ID NO: 147), Figure 93 (SEQ ID NO: 152), 
Figure 95 (SEQ ID NO: 157), Figure 97 (SEQ ID NO: 159), Figure 99 (SEQ ID NO: 161), Figure 101 (SEQ ID 
NO:169), Figure 103 (SEQ ID NO:179), Figure 105 (SEQ ID NO:188), Figure 107 (SEQ ID NO:193), Figure 
109 (SEQ ID NO:195), Figure 111 (SEQ ID NO:197), Figure 113 (SEQ ID NO:202), Figure 115 (SEQ ID 

NO:209), Figure 117 (SEQ ID NO:211), Figure 119 (SEQ ID NO:213), Figure 121 (SEQ ID NO:215), Figure 
123 (SEQ ID NO:217), Figure 125 (SEQ ID NO:219), Figure 127 (SEQ ID NO:224), Figure 129 (SEQ ID 
NO:226), Figure 131 (SEQ ID NO:228), Figure 133 (SEQ ID NO:233), Figure 135 (SEQ ID NO:235), Figure 
137 (SEQ ID NO:242), Figure 139 (SEQ ID NO:247), Figure 141 (SEQ ID NO:252), Figure 143 (SEQ ID 

NO:259), Figure 145 (SEQ ID NO:264), Figure 147 (SEQ ID NO:266), Figure 149 (SEQ ID NO:268), Figure 
151 (SEQ ID NO:270), Figure 153 (SEQ ID NO:272), Figure 155 (SEQ ID NO:274), Figure 157 (SEQ ID 
NO:276), Figure 159 (SEQ ID NO:281), Figure 161 (SEQ ID NO:286), Figure 163 (SEQ ID NO:291), Figure 
165 (SEQ ID NO:296), Figure 167 (SEQ ID NO:301), Figure 169 (SEQ ID NO:303), Figure 171 (SEQ ID 

NO:305), Figure 173 (SEQ ID NO:307), Figure 175 (SEQ ID NO:309), Figure 177 (SEQ ID NO:314), Figure 
179 (SEQ ID NO:316), Figure 181 (SEQ ID NO:321), Figure 183 (SEQ ID NO:323), Figure 185 (SEQ ID 
NO:325), Figure 187 (SEQ ID NO:327), Figure 189 (SEQ ID NO:329), Figure 191 (SEQ ID NO:331), Figure 
193 (SEQ ID NO:333), Figure 195 (SEQ ID NO:335), Figure 197 (SEQ ID NO:337), Figure 199 (SEQ ID 
NO:339), Figure 201 (SEQ ID NO:346), Figure 203 (SEQ ID NO:351), Figure 205 (SEQ ID NO:353), Figure 
207 (SEQ ID NO:355), Figure 209 (SEQ ID NO:357), Figure 211 (SEQ ID NO:363), Figure 213 (SEQ ID 
NO:365), Figure 215 (SEQ ID NO:371), Figure 217 (SEQ ID NO:373), Figure 219 (SEQ ID NO:375), Figure 
221 (SEQ ID NO:377), Figure 223 (SEQ ID NO:382), Figure 225 (SEQ ID NO:384), Figure 227 (SEQ ID 
NO:389), Figure 229 (SEQ ID NO:394), Figure 231 (SEQ ID NO:396), Figure 233 (SEQ ID NO:401), Figure 
235 (SEQ ID NO:405), Figure 237 (SEQ ID NO:409), Figure 239 (SEQ ID NO:414), Figure 241 (SEQ ID 
NO:422), Figure 242 (SEQ ID NO:428) and Figure 245 (SEQ ID NO:430). 
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3 . The nucleic acid of Claim 1 , wherein said nucleotide sequence comprises a nucleotide sequence 
selected from the group consisting of the full-length coding sequence of the sequence shown in Figure 1 (SEQ 
ID NO:3), Figure 3 (SEQ ID NO:5), Figure 5 (SEQ ID NO:7), Figure 7 (SEQ ID NO:9), Figure 9 (SEQ ID 
NO:11), Figure 11 (SEQ ID NO:16), Figure 13 (SEQ ID NO:21), Figure 15 (SEQ ID NO:23), Figure 17 (SEQ 
ID NO:28), Figure 19 (SEQ ID NO:30), Figure 21 (SEQ ID NO:32), Figure 23 (SEQ ID NO:40), Figure 25 
(SEQ ID NO:42), Figure 27 (SEQ ID NO:49), Figure 29 (SEQ ID NO:51), Figure 31 (SEQ ID NO:53), Figure 
33 (SEQ ID NO:55), Figure 35 (SEQ ID NO:57), Figure 37 (SEQ ID NO:62), Figure 39 (SEQ ID NO:67), 
Figure 41 (SEQ ID NO:69), Figure 43 (SEQ ID NO:71), Figure 45 (SEQ ID NO:76), Figure 47 (SEQ ID 
NO:78), Figure 49 (SEQ ID NO:83), Figure 51 (SEQ ID NO:85), Figure 53 (SEQ ID NO:87), Figure 55 (SEQ 
ID NO:94), Figure 57 (SEQ ID NO:99), Figure 59 (SEQ ID NO:101), Figure 61 (SEQ ID NO:103), Figure 
63 (SEQ ID NO:110), Figure 65 (SEQ ID NO:115), Figure 67 (SEQ ID NO:117), Figure 69 (SEQ ID NO:122), 
Figure 71 (SEQ ID NO:127), Figure 73 (SEQ ID NO:129), Figure 75 (SEQ ID NO:131), Figure 77 (SEQ ID 
NO:133), Figure 79 (SEQ ID NO:135), Figure 81 (SEQ ID NO:137), Figure 83 (SEQ ID NO:139), Figure 85 
(SEQ ID NO:141), Figure 87 (SEQ ID NO:143), Figure 89 (SEQ ID NO:145), Figure 91 (SEQ ID NO:147), 
Figure 93 (SEQ ID NO:152), Figure 95 (SEQ ID NO:157), Figure 97 (SEQ ID NO:159), Figure 99 (SEQ ID 
NO:161), Figure 101 (SEQ ID NO:169), Figure 103 (SEQ ID NO:179), Figure 105 (SEQ ID NO:188), Figure 
107 (SEQ ID NO:193), Figure 109 (SEQ ID NO:195), Figure 111 (SEQ ID NO:197), Figure 113 (SEQ ID 
NO:202), Figure 115 (SEQ ID NO:209), Figure 117 (SEQ ID NO:211), Figure 119 (SEQ ID NO:213), Figure 
121 (SEQ ID NO:215), Figure 123 (SEQ ID NO:217), Figure 125 (SEQ ID NO:219), Figure 127 (SEQ ID 
NO:224), Figure 129 (SEQ ID NO:226), Figure 131 (SEQ ID NO:228), Figure 133 (SEQ ID NO:233), Figure 
135 (SEQ ID NO:235), Figure 137 (SEQ ID NO:242), Figure 139 (SEQ ID NO:247), Figure 141 (SEQ ID 
NO:252), Figure 143 (SEQ ID NO:259), Figure 145 (SEQ ID NO:264), Figure 147 (SEQ ID NO:266), Figure 
149 (SEQ ID NO:268), Figure 151 (SEQ ID NO:270), Figure 153 (SEQ ID NO:272), Figure 155 (SEQ ID 
NO:274), Figure 157 (SEQ ID NO:276), Figure 159 (SEQ ID NO:281), Figure 161 (SEQ ID NO:286), Figure 
163 (SEQ ID NO:291), Figure 165 (SEQ ID NO:296), Figure 167 (SEQ ID NO:301), Figure 169 (SEQ ID 
NO:303), Figure 171 (SEQ ID NO:305), Figure 173 (SEQ ID NO:307), Figure 175 (SEQ ID NO:309), Figure 
177 (SEQ ID NO:314), Figure 179 (SEQ ID NO:316), Figure 181 (SEQ ID NO:321), Figure 183 (SEQ ID 
NO:323), Figure 185 (SEQ ID NO:325), Figure 187 (SEQ ID NO:327), Figure 189 (SEQ ID NO:329), Figure 
191 (SEQ ID NO:331), Figure 193 (SEQ ID NO:333), Figure 195 (SEQ ID NO:335), Figure 197 (SEQ ID 
NO:337), Figure 199 (SEQ ID NO:339), Figure 201 (SEQ ID NO:346), Figure 203 (SEQ ID NO:351), Figure 
205 (SEQ ID NO:353), Figure 207 (SEQ ID NO:355), Figure 209 (SEQ ID NO:357), Figure 211 (SEQ ID 
NO:363), Figure 213 (SEQ ID NO:365), Figure 215 (SEQ ID NO:371), Figure 217 (SEQ ID NO:373), Figure 
219 (SEQ ID NO:375), Figure 221 (SEQ ID NO:377), Figure 223 (SEQ ID NO:382), Figure 225 (SEQ ID 
NO:384), Figure 227 (SEQ ID NO:389), Figure 229 (SEQ ID NO:394), Figure 231 (SEQ ID NO:396), Figure 
233 (SEQ ID NO:401), Figure 235 (SEQ ID NO:405), Figure 237 (SEQ ID NO:409), Figure 239 (SEQ ID 
NO:414), Figure 241 (SEQ ID NO:422), Figure 242 (SEQ ID NO:428) and Figure 245 (SEQ ID NO:430). 
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4. Isolated nucleic acid which comprises the full-length coding sequence of the DNA deposited 
under any ATCC accession number shown in Table 2. 

5. A vector comprising the nucleic acid of Claim 1 . 

6. The vector of Claim 5 operably linked to control sequences recognized by a host cell 
transformed with the vector. 

7. A host cell comprising the vector of Claim 5. 

8. The host cell of Claim 7 wherein said cell is a CHO cell. 

9. The host cell of Claim 7 wherein said cell is an E. coli. 

10. The host cell of Claim 7 wherein said cell is a yeast cell. 

11. A process for producing a PRO polypeptide comprising culturing the host cell of Claim 7 
under conditions suitable for expression of said PRO polypeptide and recovering said PRO polypeptide from the 
cell culture. 

12. Isolated PRO polypeptide having at least 80% sequence identity to an amino acid sequence 
selected from the group consisting of the amino acid sequence shown in Figure 2 (SEQ ID NO:4), Figure 4 (SEQ 
ID NO:6), Figure 6 (SEQ ID NO:8), Figure 8 (SEQ ID NO:10), Figure 10 (SEQ ID NO:12), Figure 12 (SEQ 
ID NO: 17), Figure 14 (SEQ ID NO:22), Figure 16 (SEQ ID NO:24), Figure 18 (SEQ ID NO:29), Figure 20 
(SEQ ID NO:31), Figure 22 (SEQ ID NO:33), Figure 24 (SEQ ID NO:41), Figure 26 (SEQ ID NO:43), Figure 
28 (SEQ ID NO:50), Figure 30 (SEQ ID NO:52), Figure 32 (SEQ ID NO:54), Figure 34 (SEQ ID NO:56), 
Figure 36 (SEQ ID NO:58), Figure 38 (SEQ ID NO:63), Figure 40 (SEQ ID NO:68), Figure 42 (SEQ ID 
NO:70), Figure 44 (SEQ ID NO:72), Figure 46 (SEQ ID NO:77), Figure 48 (SEQ ID NO:79), Figure 50 (SEQ 
ID NO:84), Figure 52 (SEQ ID NO:86), Figure 54 (SEQ ID NO:88), Figure 56 (SEQ ID NO:95), Figure 58 
(SEQ ID NO:100), Figure 60 (SEQ ID NO:102), Figure 62 (SEQ ID NO:104), Figure 64 (SEQ ID NO:111), 
Figure 66 (SEQ ID NO:116), Figure 68 (SEQ ID NO:118), Figure 70 (SEQ ID NO:123), Figure 72 (SEQ ID 
NO: 128), Figure 74 (SEQ ID NO: 130), Figure 76 (SEQ ID NO: 132), Figure 78 (SEQ ID NO: 134), Figure 80 
(SEQ ID NO:136), Figure 82 (SEQ ID NO:138), Figure 84 (SEQ ID NO:140), Figure 86 (SEQ ID NO:142), 
Figure 88 (SEQ ID NO:144), Figure 90 (SEQ ID NO:146), Figure 92 (SEQ ID NO:148), Figure 94 (SEQ ID 
NO:153), Figure 96 (SEQ ID NO:158), Figure 98 (SEQ ID NO:160), Figure 100 (SEQ ID NO:162), Figure 
102 (SEQ ID NO: 170), Figure 104 (SEQ ID NO: 180), Figure 106 (SEQ ID NO: 189), Figure 108 (SEQ ID 
NO:194), Figure 110 (SEQ ID NO:196), Figure 112 (SEQ ID NO:198), Figure 114 (SEQ ID NO:203), Figure 
116 (SEQ ID NO:210), Figure 118 (SEQ ID NO:212), Figure 120 (SEQ ID NO:214), Figure 122 (SEQ ID 
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NO:216), Figure 124 (SEQ ID NO:218), Figure 126 (SEQ ID NO:220), Figure 128 (SEQ ID NO:225), Figure 
130 (SEQ ID NO:227), Figure 132 (SEQ ID NO:229), Figure 134 (SEQ ID NO:234), Figure 136 (SEQ ID 
NO:236), Figure 138 (SEQ ID NO:243), Figure 140 (SEQ ID NO:248), Figure 142 (SEQ ID NO:253), Figure 
144 (SEQ ID NO:260), Figure 146 (SEQ ID NO:265), Figure 148 (SEQ ID NO:267), Figure 150 (SEQ ID 
NO:269), Figure 152 (SEQ ID NO:271), Figure 154 (SEQ ID NO:273), Figure 156 (SEQ ID NO:275), Figure 
158 (SEQ ID NO:277), Figure 160 (SEQ ID NO:282), Figure 162 (SEQ ID NO:287), Figure 164 (SEQ ID 
NO:292), Figure 166 (SEQ ID NO:297), Figure 168 (SEQ ID NO:302), Figure 170 (SEQ ID NO:304), Figure 
172 (SEQ ID NO:306), Figure 174 (SEQ ID NO:308), Figure 176 (SEQ ID NO:310), Figure 178 (SEQ ID 
NO:315), Figure 180 (SEQ ID NO:317), Figure 182 (SEQ ID NO:322), Figure 184 (SEQ ID NO:324), Figure 
186 (SEQ ID NO:326), Figure 188 (SEQ ID NO:328), Figure 190 (SEQ ID NO:330), Figure 192 (SEQ ID 
NO:332), Figure 194 (SEQ ID NO:334), Figure 196 (SEQ ID NO:336), Figure 198 (SEQ ID NO:338), Figure 
200 (SEQ ID NO:340), Figure 202 (SEQ ID NO:347), Figure 204 (SEQ ID NO:352), Figure 206 (SEQ ID 
NO:354), Figure 208 (SEQ ID NO:356), Figure 210 (SEQ ID NO:358), Figure 212 (SEQ ID NO:364), Figure 
214 (SEQ ID NO:366), Figure 216 (SEQ ID NO:372), Figure 218 (SEQ ID NO:374), Figure 220 (SEQ ID 
NO:376), Figure 222 (SEQ ID NO:378), Figure 224 (SEQ ID NO:383), Figure 226 (SEQ ID NO:385), Figure 
228 (SEQ ID NO:390), Figure 230 (SEQ ID NO:395), Figure 232 (SEQ ID NO:397), Figure 234 (SEQ ID 
NO:402), Figure 236 (SEQ ID NO:406), Figure 238 (SEQ ID NO:410), Figure 240 (SEQ ID NO:415), Figure 
242 (SEQ ID NO:423), Figure 244 (SEQ ID NO:429) and Figure 246 (SEQ ID NO:431). 

13. Isolated PRO polypeptide having at least 80% sequence identity to the amino acid sequence 
encoded by a nucleic acid molecule deposited under any ATCC accession number shown in Table 2. 

14. A chimeric molecule comprising a polypeptide according to Claim 12 fused to a heterologous 
amino acid sequence. 

15. The chimeric molecule of Claim 14 wherein said heterologous amino acid sequence is an 
epitope tag sequence. 

16. The chimeric molecule of Claim 14 wherein said heterologous amino acid sequence is an Fc 
region of an immunoglobulin. 

17. An antibody which specifically binds to a PRO polypeptide according to Claim 12. 

18. The antibody of Claim 17 wherein said antibody is a monoclonal antibody. 

19. The antibody of Claim 17 wherein said antibody is a humanized antibody. 

20. The antibody of Claim 17 wherein said antibody is an antibody fragment. 
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21 . An isolated nucleic acid which has at least 80% sequence identity to a nucleic acid sequence 
selected from the group consisting of that shown in Figure 1 (SEQ ID NO:3), Figure 3 (SEQ ID NO:5), Figure 
5 (SEQ ID NO:7), Figure 7 (SEQ ID NO:9), Figure 9 (SEQ ID NO:11), Figure 11 (SEQ ID NO:16), Figure 
13 (SEQ ID NO:21), Figure 15 (SEQ ID NO:23), Figure 17 (SEQ ID NO:28), Figure 19 (SEQ ID NO:30), 
Figure 21 (SEQ ID NO:32), Figure 23 (SEQ ID NO:40), Figure 25 (SEQ ID NO:42), Figure 27 (SEQ ID 
NO:49), Figure 29 (SEQ ID NO:51), Figure 31 (SEQ ID NO:53), Figure 33 (SEQ ID NO:55), Figure 35 (SEQ 
ID NO:57), Figure 37 (SEQ ID NO:62), Figure 39 (SEQ ID NO:67), Figure 41 (SEQ ID NO:69), Figure 43 
(SEQ ID NO:71), Figure 45 (SEQ ID NO:76), Figure 47 (SEQ ID NO:78), Figure 49 (SEQ ID NO:83), Figure 
51 (SEQ ID NO:85), Figure 53 (SEQ ID NO:87), Figure 55 (SEQ ID NO:94), Figure 57 (SEQ ID NO:99), 
Figure 59 (SEQ ID NO:101), Figure 61 (SEQ ID NO:103), Figure 63 (SEQ ID NO:110), Figure 65 (SEQ ID 
NO:115), Figure 67 (SEQ ID NO:117), Figure 69 (SEQ ID NO:122), Figure 71 (SEQ ID NO:127), Figure 73 
(SEQ ID NO:129), Figure 75 (SEQ ID NO:131), Figure 77 (SEQ ID NO:133), Figure 79 (SEQ ID NO: 135), 
Figure 81 (SEQ ID NO:137), Figure 83 (SEQ ID NO:139), Figure 85 (SEQ ID NO:141), Figure 87 (SEQ ID 
NO: 143), Figure 89 (SEQ ID NO: 145), Figure 91 (SEQ ID NO: 147), Figure 93 (SEQ ID NO: 152), Figure 95 
(SEQ ID NO:157), Figure 97 (SEQ ID NO:159), Figure 99 (SEQ ID NO:161), Figure 101 (SEQ ID NO:169), 
Figure 103 (SEQ ID NO: 179), Figure 105 (SEQ ID NO: 188), Figure 107 (SEQ ID NO: 193), Figure 109 (SEQ 
ID NO:195), Figure 111 (SEQ ID NO:197), Figure 113 (SEQ ID NO:202), Figure 115 (SEQ ID NO:209), 
Figure 117 (SEQ ID NO:211), Figure 119 (SEQ ID NO:213), Figure 121 (SEQ ID NO:215), Figure 123 (SEQ 
ID NO:217), Figure 125 (SEQ ID NO:219), Figure 127 (SEQ ID NO:224), Figure 129 (SEQ ID NO:226), 
Figure 131 (SEQ ID NO:228), Figure 133 (SEQ ID NO:233), Figure 135 (SEQ ID NO:235), Figure 137 (SEQ 
ID NO:242), Figure 139 (SEQ ID NO:247), Figure 141 (SEQ ID NO:252), Figure 143 (SEQ ID NO:259), 
Figure 145 (SEQ ID NO:264), Figure 147 (SEQ ID NO:266), Figure 149 (SEQ ID NO:268), Figure 151 (SEQ 
ID NO:270), Figure 153 (SEQ ID NO:272), Figure 155 (SEQ ID NO:274), Figure 157 (SEQ ID NO:276), 
Figure 159 (SEQ ID NO:281), Figure 161 (SEQ ID NO:286), Figure 163 (SEQ ID NO:291), Figure 165 (SEQ 
ID NO:296), Figure 167 (SEQ ID NO:301), Figure 169 (SEQ ID NO:303), Figure 171 (SEQ ID NO:305), 
Figure 173 (SEQ ID NO:307), Figure 175 (SEQ ID NO:309), Figure 177 (SEQ ID NO:314), Figure 179 (SEQ 
ID NO:316), Figure 181 (SEQ ID NO:321), Figure 183 (SEQ ID NO:323), Figure 185 (SEQ ID NO:325), 
Figure 187 (SEQ ID NO:327), Figure 189 (SEQ ID NO:329), Figure 191 (SEQ ID NO:331), Figure 193 (SEQ 
ID NO:333), Figure 195 (SEQ ID NO:335), Figure 197 (SEQ ID NO:337), Figure 199 (SEQ ID NO:339), 
Figure 201 (SEQ ID NO:346), Figure 203 (SEQ ID NO:351), Figure 205 (SEQ ID NO:353), Figure 207 (SEQ 
ID NO:355), Figure 209 (SEQ ID NO:357), Figure 211 (SEQ ID NO:363), Figure 213 (SEQ ID NO:365), 
Figure 215 (SEQ ID NO:371), Figure 217 (SEQ ID NO:373), Figure 219 (SEQ ID NO:375), Figure 221 (SEQ 
ID NO:377), Figure 223 (SEQ ID NO:382), Figure 225 (SEQ ID NO:384), Figure 227 (SEQ ID NO:389), 
Figure 229 (SEQ ID NO:394), Figure 231 (SEQ ID NO:396), Figure 233 (SEQ ID NO:401), Figure 235 (SEQ 
ID NO:405), Figure 237 (SEQ ID NO:409), Figure 239 (SEQ ID NO:414), Figure 241 (SEQ ID NO:422), 
Figure 242 (SEQ ID NO:428) and Figure 245 (SEQ ID NO:430). 
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22. An isolated nucleic acid which has at least 80% sequence identity to the full-length coding 
sequence of a nucleotide sequence selected from the group consisting of that shown in Figure 1 (SEQ ID NO:3), 
Figure 3 (SEQ ID NO:5), Figure 5 (SEQ ID NO:7), Figure 7 (SEQ ID NO:9), Figure 9 (SEQ ID NO:11), 
Figure 11 (SEQ ID NO: 16), Figure 13 (SEQ ID NO:21), Figure 15 (SEQ ID NO:23), Figure 17 (SEQ ID 
NO:28), Figure 19 (SEQ ID NO:30), Figure 21 (SEQ ID NO:32), Figure 23 (SEQ ID NO:40), Figure 25 (SEQ 
ID NO:42), Figure 27 (SEQ ID NO:49), Figure 29 (SEQ ID NO:51), Figure 31 (SEQ ID NO:53), Figure 33 
(SEQ ID NO:55), Figure 35 (SEQ ID NO:57), Figure 37 (SEQ ID NO:62), Figure 39 (SEQ ID NO:67), Figure 
41 (SEQ ID NO:69), Figure 43 (SEQ ID NO:71), Figure 45 (SEQ ID NO:76), Figure 47 (SEQ ID NO:78), 
Figure 49 (SEQ ID NO:83), Figure 51 (SEQ ID NO:85), Figure 53 (SEQ ID NO:87), Figure 55 (SEQ ID 
NO:94), Figure 57 (SEQ ID NO:99), Figure 59 (SEQ ID NO:101), Figure 61 (SEQ ID NO:103), Figure 63 
(SEQ ID NO:110), Figure 65 (SEQ ID NO:115), Figure 67 (SEQ ID NO:117), Figure 69 (SEQ ID NO:122), 
Figure 71 (SEQ ID NO:127), Figure 73 (SEQ ID NO:129), Figure 75 (SEQ ID NO: 131), Figure 77 (SEQ ID 
NO:133), Figure 79 (SEQ ID NO:135), Figure 81 (SEQ ID NO:137), Figure 83 (SEQ ID NO:139), Figure 85 
(SEQ ID NO:141), Figure 87 (SEQ ID NO:143), Figure 89 (SEQ ID NO:145), Figure 91 (SEQ ID NO:147), 
Figure 93 (SEQ ID NO:152), Figure 95 (SEQ ID NO:157), Figure 97 (SEQ ID NO:159), Figure 99 (SEQ ID 
NO:161), Figure 101 (SEQ ID NO:169), Figure 103 (SEQ ID NO:179), Figure 105 (SEQ ID NO:188), Figure 
107 (SEQ ID NO: 193), Figure 109 (SEQ ID NO: 195), Figure 111 (SEQ ID NO: 197), Figure 113 (SEQ ID 
NO:202), Figure 115 (SEQ ID NO:209), Figure 117 (SEQ ID NO:211), Figure 119 (SEQ ID NO:213), Figure 
121 (SEQ ID NO:215), Figure 123 (SEQ ID NO:217), Figure 125 (SEQ ID NO:219), Figure 127 (SEQ ID 
NO:224), Figure 129 (SEQ ID NO:226), Figure 131 (SEQ ID NO:228), Figure 133 (SEQ ID NO:233), Figure 
135 (SEQ ID NO:235), Figure 137 (SEQ ID NO:242), Figure 139 (SEQ ID NO:247), Figure 141 (SEQ ID 
NO:252), Figure 143 (SEQ ID NO:259), Figure 145 (SEQ ID NO:264), Figure 147 (SEQ ID NO:266), Figure 
149 (SEQ ID NO:268), Figure 151 (SEQ ID NO:270), Figure 153 (SEQ ID NO:272), Figure 155 (SEQ ID 
NO:274), Figure 157 (SEQ ID NO:276), Figure 159 (SEQ ID NO:281), Figure 161 (SEQ ID NO:286), Figure 
163 (SEQ ID NO:291), Figure 165 (SEQ ID NO:296), Figure 167 (SEQ ID NO:301), Figure 169 (SEQ ID 
NO:303), Figure 171 (SEQ ID NO:305), Figure 173 (SEQ ID NO:307), Figure 175 (SEQ ID NO:309), Figure 
177 (SEQ ID NO:314), Figure 179 (SEQ ID NO:316), Figure 181 (SEQ ID NO:321), Figure 183 (SEQ ID 
NO:323), Figure 185 (SEQ ID NO:325), Figure 187 (SEQ ID NO:327), Figure 189 (SEQ ID NO:329), Figure 
191 (SEQ ID NO:331), Figure 193 (SEQ ID NO:333), Figure 195 (SEQ ID NO:335), Figure 197 (SEQ ID 
NO:337), Figure 199 (SEQ ID NO:339), Figure 201 (SEQ ID NO:346), Figure 203 (SEQ ID NO:351), Figure 
205 (SEQ ID NO:353), Figure 207 (SEQ ID NO:355), Figure 209 (SEQ ID NO:357), Figure 211 (SEQ ID 
NO:363), Figure 213 (SEQ ID NO:365), Figure 215 (SEQ ID NO:371), Figure 217 (SEQ ID NO:373), Figure 
219 (SEQ ID NO:375), Figure 221 (SEQ ID NO:377), Figure 223 (SEQ ID NO:382), Figure 225 (SEQ ID 
NO:384), Figure 227 (SEQ ID NO:389), Figure 229 (SEQ ID NO:394), Figure 231 (SEQ ID NO:396), Figure 
233 (SEQ ID NO:401), Figure 235 (SEQ ID NO:405), Figure 237 (SEQ ID NO:409), Figure 239 (SEQ ID 
NO:414), Figure 241 (SEQ ID NO:422), Figure 242 (SEQ ID NO:428) and Figure 245 (SEQ ID NO:430). 

23. An isolated extracellular domain of a PRO polypeptide. 
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24. An isolated PRO polypeptide lacking its associated signal peptide. 

25. An isolated polypeptide having at least about 80% amino acid sequence identity to an 
extracellular domain of a PRO polypeptide. 

26. An isolated polypeptide having at least about 80% amino acid sequence identity to a PRO 
polypeptide lacking its associated signal peptide. 

27. An isolated nucleic acid encoding the polypeptide of any one of Claims 23 to 26. 



499 



WO 00/12708 



PCT/US99/20111 



FIGURE 1 

CCAATCGCCCGGTGCGGTGGTGCAGGGTCTCGGGCTAGTCATGGCGTCCCCGTCTCGGAGAC 
TG CAGACT AAAC CAGT C ATTACTTGTTTC AAGAG CGTT CTGCTAAT CTACACTTTTATTTTC 
TGGATCACTGGCGTTATCCTTCTTGCAGTTGGCATTTGGGGCAAGGTGAGCCTGGAGAATTA 
CTTTTCTCTTTTAAATGAGAAGGCCACCAATGTCCCCTTCGTGCTCATTGCTACTGGTACCG 
TCATTATTCTTTTGGGCACCTTTGGTTGTTTTGCTACCTGCCGAGCTTCTGCATGGATGCTA 
AAACTGTATGCAATGTTTCTGACTCTCGTTTTTTTGGTCGAACTGGTCGCTGCCATCGTAGG 
AT TTGTTTTC AGAC ATGAGATT AAGAACAG CTTTAAGAATAATTATG AGAAGGCTTTGAAGC 
AGT ATAACT C TACAGG AG ATTATAGAAG C CATGC AGTAGACAAGATC C AAAAT ACGTT GCAT 
TG TTGTGG TG T CAC CG ATTATAGAGATT GG ACAGATACTAATT ATTACTC AGAAAAAGGATT 
T CCT AAG AGT TG CTGT AAAC TTGAAG ATT GTACTC CACAGAGAGATGC AG ACAAAGT AAAC A 
AT G AAG GT TG TTTT AT AAAGGTGATGACCATTATAGAGT CAGAAATGGGAGT CGTTG C AGGA 
ATTTCCTTTGGAGTTGCTTGCTTCCAACTGATTGGAATCTTTCTCGCCTACTGCCWCTCTCG 
TG CC AT AA CAAAT AAC CAGTATG AGATAGTGTAACCCAATGT AT CTGT GG G C CT ATTC CT CT 
CT AC CT TT AAGGAC ATTTAGGGT CC C C C CTGTGAATTAGAAAGTTG CT TG G CTGGAG AACTG 
AC AACA CT AC TTACTG ATAG AC CAAAAAACTACA CCAG T AGGTTGATT CAAT CAAGATGT AT 
GTAGAC CTAAAACTACACCAATAGG CTGATT C AATCAAGAT CCGTG CT CG C AGTGGGCTG AT 
T CAAT CAAGATGT ATGTTTGCTATGTTCTAAGTCCACCTTCT AT CCCATTCATGTT AG ATCG 
TTGAAACC CTGTAT C CCTCTGAAAC ACTGGAAGAGCTAGT AAATTGTAAATGAAGT 
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FIGURE 2 

></usr/seqdb2/sst /DNA/Dnaseqs . min/ss . DNA19902 
<subunit 1 of 1, 245 aa, 1 stop, 1 unknown 
<MW: -1, pI: 8.36, NX(S/T): 1 

MASPSRRLQTKPVITCFKSVLLIYTFIFWITGVILLAVGIWGKVSLENYFSLLNEKATNVPF 
VLIATGTVIILLGTFGCFATCRASAWMLKLYAMFLTLVFLVELVAAIVGFVFRHEIKNSFKN 
NYEKALKQYNSTGDYRSHAVDKIQI^LHCCGVTDYRDWTDTNYYSEKGFPKSCCKLEDCTPQ 
RDADKVNNEGCFIKVMTIIESEMGVVAGISFGVACFQLIGIFLAYCXSRAITNNQYEIV 

Important features of the protein: 
Signal peptide: 

amino acids 1-42 

Transmembrane domains: 

amino acids 19-42, 61-83, 92-114, 209-230, 

N-glycosylation site. 

amino acids 134-138 

Tyrosine kinase phosphorylation site. 

amino acids 160-168, 160-169 

N-myristoylation site. 

amino acids 75-81, 78-84, 210-216, 214-220, 226-232 

Prokaryotic membrane lipoprotein lipid attachment site. 
amino acids 69-80, 211-222 



WO 00/12708 PCT/US99/20111 



FIGURE 3 

CCCACGCGTCCGGCGCCGTGGCCTCGCGTCCATCTTTGCCGTTCTCTCG6ACCTGTCACAAA 
GGAGTCGCGCCGCCGCCGCCGCCCCCTCCCTCCGGTGGGCCCGGGAGGTAGAGAAAGTCAGT 
GCCACAGCCCGACCGCGCTGCTCTGAGCCCTGGGCACGCGGAACGGGAGGGAGTCTGAGGGT 
TGGGGACGTCTGTGAGGGAGGGGAACAGCCGCTCGAGCCTGGGGCGGGCGGACCGGACTGGG 
GCCGGGGTAGGCTCTGGAAAGGGCCCGGGAGAGAGGTGGCGTTGGTCAGAACCTGAGAAACA 
GCCGAGAGGTTTTCCACCGAGGCCCGCGCTTGAGGGATCTGAAGAGGTTCCTAGAAGAGGGT 
GTTCCCTCTTTCGGGGGTCCTCACCAGAAGAC^TTCTTGGGGGTCGCCCTTCTGAGGAGGCT 
GCGGCTAACAGGGCCCAGAACTGCCATTGGATGTCCAGAATCCCCTGTAGTTGATAATGTTG 
GGAATAAG CT CT GC AACTTT CTTTGGCATT CAGTTGTTAAAAACAAATAGGATG CAAATT CC 
TCAACTCCAGGTTATGAAAACAGTACTTGGAAAACTGAAAACTACCTAAMGATCGTCTTTG 
GTTGGGCCGTGTTCTTAGCGAGCAGAAGCCTTGGCCAGGGTCTGTTGTTGACTCTCGAAGAG 
CACATAGCCCACTTCCTAGGGACTGGAGGTGCCGCTACTACCATGGGTAATTCCTGTATCTG 
CCGAG ATGACAGTG GAACAG ATG ACAGTGTTG AC AC CCAACAG C AACAGG CCGAGAAC AGTG 
CAGTACCCACTGCTGACACAAGGAGCCAACCACGGGACCCTGTTCGGCCACCAAGGAGGGGC 
CGAGGACCTCATGAGCCAAGGAGAAAGAAACAAAATGTGGATGGGCTAGTGTTGGACACACT 
GGC^GTAATACGGACTCTTGTAGAT AAGTAAGTAT CTGACT CACGGT CAC CT CCAGTGGAAT 
GAAAAGTGTTCTGCCCGGAACCATGACTTTAGGACTCCTTCAGTTCCTTTAGGACATACTCG 
CCAAGCCTTGTG CT CACAGGGCAAAGGAGAATAT TTTAATGCTC CGCTGATGGCAGAGTAAA 
TGATAAGATTTGATGTTTTTGCTTGCTGTCATCTACTTTGTCTGGAAATGTCTAAATGTTTC 
TGTAGCAGAAAACACGATAAAGCTATGATCTTTATTAGAG 
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FIGURE 4 

MIVFGWAVFIJ^RSIX3QGLLLTLEEHIAHFLGTGGAATTMGNSCICRDDSGTDDSVDTQQQQ 
AENSAVPTADTRSQPRDPVRPPRRGRGPHEPRRKKQNVDGLVLDTLAVIRTLVDKO 

Signal peptide: 

amino acids 1-16 

Casein kinase II phosphorylation site. 

amino acids 22-26, 50-54, 113-117 

N-myristoylation site. 

amino acids 18-24, 32-38, 34-40, 35-41, 51-57 



WO 00/12708 PCT/US99/20111 

FIGURE 5 

GGCACGAGGCGCTGTCCACCCGGGGGCGTGGGAGTGAGGTACCAGATTCAGCCCATTTGGCC 
CCGACGCCTCTGTTCTCGGAATCCGGGTGCTGCGGATTGAGGTCCCGGTTCCTAACGGACTG 
CAAGATgGAGGAAGGCGGGAACCTAGGAGGCCTGATTAAGATGGTCCATCTACTGGTCTTGT 
CAGGTGCCTGGGGCATGCAAATGTGGGTGACCTTCGTCTCAGGCTTCCTGCTTTTCCGAAGC 
CTTCCCCGACATACCTTCGGACTAGTGCAGAGCAAACTCTTCCCCTTCTACTTCCACATCTC 
CATGGGCTGTGC CTTCAT CAAC CT CTG CAT CTTGGCTT CACAGCATGCTTGGGCT CAGCTCA 
CATTCTGGGAGGCCAG CC AGCTTTACCTG CTGTT CC TG AG C CTTA CG CTGGC CACTGTCAAC 
GCCCGCTGGCTGGAACCC CGCACCACAG CTGCCATGTGGGCCCTGCAAACCGTGGAGAAGGA 
GCGAGGCCTGGGTGGGGAGGTACCAGGCAGCCACCAGGGTCCCGATCCCTACCGCCAGCTGC 
GAGAGAAGGACC CCAAGTACAGTG CTCTC CGCCAGAATTTCTTCCGCTAC CATGGGCTGTCC 
TCTCTTTGCAATCTGGGCTGCGTCCTGAGCAATGGGCTCTGTCTCGCTGGCCTTGCCCTGGA 
AATAAGGAGCCTCTAGCATGGGCCCTGCATGCTAATAAATGCTTCTTCAGAAATGAAAAAAA 
AAAAAAAAAAAA 
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FIGURE 6 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA56107 
<subunit 1 of 1, 231 aa, 1 stop 
<NX(S/T) : 0 

MEEGGNLGGLIKMVHLLVLSGAWGMQMWrFVSGFLLFRSLPRHTFGLVQSKLFPFYFHISM 

GCAFINLCILASQHAWAQLTFWEASQLYLLFLSL 

GLGGEVPGSHQGPDPYRQLREKDPKYSALRQNFFR^ 

Signal peptide: 
amino acids 1-24 

Transmembrane domain: 

amino acids 86-103, 60-75 

Casein kinase II phosphorylation site. 

amino acids 82-86 

Tyrosine kinase phosphorylation site. 

amino acids 144-151 

N-myristoylation site. 

amino acids 4-10, 5-11, 47-53, 170-176, 176-182 

Prokaryotic membrane lipoprotein lipid attachment site. 

amino acids 54-65 

G-protein coupled receptors proteins. 

amino acids 44-85 
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FIGURE 7 

AATT CAGATTTTAAG CC CATTCTG CAGTGGAATTT CATGAACTAG CAAG AGGACACC ATC TT 
CTTGTATTATACAAGAAAGGAGTGTACCTATCACACACAGGGGGAAAAATGCTCTTTTGGGT 
GCTAGGCCT C CTAAT C CTCTGTGGTTTT CTGTGGACTCGTAAAGGAAAACTAAAGATTGAAG 
ACATCAC TGATAAGTACATTTTTAT C ACTGGATGTGAC TCGGGCT TTGGAAACTTGGC AG C C 
AGAACTTTTGAT AAAAAGGGATTTCATG TAAT C G CTG C CTGT CTGACTG AAT CAG GATCAAC 
AGCTTTAAAGGCAGAAACCTCAGAGAGACTTCGTACTGTGCTTCTGGATGTGACCGACCCAG 
AGAATGTCAAGAGGACTGCCCAGTGGGTGAAGAACCAAGTTGGGGAGAAAGGTCTCTGGGGT 
CTGATCAATAATGCTGGTGTTCCCGGCGTGCTGGCTCCCACTGACTGGCTGACACTAGAGGA 
CTACAGAGAACCTATTGAAGTGAACCTGTTTGGACTCATCAGTGTGACACTAAATATGCTTC 
CT TTGGTC AAGAAAG CTC AAGGGAG AG TTATTAATGTCTCCAGTGTTGGAGGTCGC CTTG CA 
AT CGTTGGAGGGGG CTAT ACTCCATCCAAATATGCAGTGGAAGGTTTCAATGACAGCTTAAG 
ACGGGACATGAAAGCTTTTGGTGTGCACGTCTCATGCATTGAACCAGGATTGTTCAAAACAA 
AC TTGGCAGAT CCAGTAAAGGTAATTGAAAAAAAACTC GCCATTTGGG AG CAGCTGT CTCCA 
GACATCAAACAACAATATGGAGAAG GTT AC ATTGAAAAAAGT CT AGACAAACTG AAAGGCAA 
TAAATCCTATGTGAACATGGACCTCTCTCCGGTGGTAGAGTGCATGGACCACGCTCTAACAA 
GTCTCTTCCCTAAGACTCATTATGCCGCTGGAAAAGATGCCAAAATTTTCTGGATACCTCTG 
TC TCACATG C CAGCAGCT TT GC AAGACTTTTTATTGTTGAAACAGAAAGCAGAG CTGGCTAA 
TCCCAAGGCAGTG^SaCTCAGCTAACCACAAATGTCTCCTCCAGGCTATGAAATTGGCCGAT 
TTCAAG AACA CATCTC CTTT TC AACC C C ATTC CTT ATC TG CT C CAACCTGGACTCATTTAGA 
TCGTGCTTATTTGGATTGCAAAAGGGAGTCCCACCATCGCTGGTGGTATCCCAGGGTCCCTG 
CT CAAGTTTT CTTTGAAAAGGAGGGCTGGAATGGTACATCACATAGG CAAGTC CTG CC CTGT 
ATTTAGGCTTTGCCTGCTTGGTGTGATGTAAGGGAAATTGAAAGACTTGCCCATTCAAAATG 
ATCTTTACCGTGGCCTGCCCCATGCTTATGGTCCCC^GCATTTACAGTAACTTGTGAATGTT 
AAGT ATCAT CTCTT AT CTAAATATTAAAAGATAAGTCAACCC AAAAAAAAAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAA 
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></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA56406 
<subunit 1 of 1, 319 aa, 1 stop 
<MW: 35227, pI: 8.97, NX(S/T): 3 
MLFWVLGLLILCGFLWTRKGKLKIEDITDK^ 

ESGS TALKAETS ERLRTVLLDVTD PENVKRTAQWVKNQVGEKGLWGL I NNAGVPGVLAPTDW 
LTLED YRE P I EVNL FGL I S VTLNMLP LVKKAQ GRVI NVS S VGGRLAI-VGGGYTPS KYAVEGF 
NDSLRRDMKAFGVHVSCIEPGLFKTNI^PVKVIEKKLAIWEQLSPDIKQQYGEGYIEKSLD 

KLKG^SYVNMDLSPWECMDHALTSLFPKTHYAAGKDAKIFWIPLSHMPAALQDFLLLKQ^ 
AELANPKAV 

Important features of the protein: 
Signal peptide: 

amino acids 1-17 

Transmembrane domain: 

amino acids 136-152 

N-glycosylation sites. 

amino acids 161-163, 187-190 and 253-256 

Glycosaminoglycan attachment site. 

amino acids 39-42 



N-myristoylation sites. 

amino acids 36-41, 42-47, 108-113, 166-171, 198-203 and 207-212 
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EIG URE 9 

GCGGGCTGTTGACGGCGCTGCGAIGGCTGCCTGCGAGGGCAGGAGAAGCGGAGCTCTCGGTT 
CCTCTCAGTCGGACTTCCTGACGCCGCCAGTGGGCGGGGCCCCTTGGGCCGTCGCCACCACT 
GTAGTCATGTACCCACCGCCGCCGCCGCCGCCTCATCGGGACTTCATCTCGGTGACGCTGAG 
CTTTGGCGAGAGCTATGACAACAGCAAGAGTTGGCGGCGG CG CTCGTGCTGGAGGAAATGGA 
AG CAACTGTCGAGATTGCAG CGGAATATGATT CTCTTC CT CC TTG C CTTT CTGCTTTT CTGT 
GGACT C CT CTT CTACATC AACTTGGCTGACCATTGGAAAG CT CTGG CTTT CAGG CTAGAGGA 
AGAG CAGAAGATGAGG CCAG AAATTGCTGGGTT AAAAC CAGC AAAT C C AC CCGTCTTACCAG 
CTCCTCAGAAGGCGGACACCGACCCTGAGAACTTACCTGAGATTTCGTCACAGAAGACACAA 
AGACACATCCAGCGGGGACCACCTCACCTGCAGATTAGACCCCCAAGCCAAGACCTGAAGGA 
TGGGACCCAGGAGGAGGCCACAAAAAGGCAAGAAGCCCCTGTGGATCCCCGCCCGGAAGGAG 
ATCCGCAGAGGACAGTCATCAGCTGGAGGGGAGCGGTGATCGAGCCTGAGCAGGGCACCGAG 
CTCCCTTCAAGAAGAGCAGAAGTGCCCACCAAGCCTCCCCTGCCACCGGCCAGGACACAGGG 
CA CACC AG TGCATCTGAA CTAT CG C CAGAAGGGCGT GATT GACGT CTTCCTGCATG CATGG A 
AAGGAT AC CGCAAGTTTG CATGGGGCCATGACGAGCTGAAGCCTGTGTCCAGGT CCTTCAGT 
G AGT GGTTTGG C CT CGGT CT C ACACTGAT CGACG CGCTGG ACAC CATGTGGATCTTGGGTCT 
GAGGAAAGAATTTGAGGAAGCCAGGAAGTGGGTGTCGAAGAAGTTACACTTTGAAAAGGACG 
TGGACGTCAACCTGTTTGAGAGCACGATCCGCATCCTGGGGGGGCTCCTGAGTGCCTACCAC 
CTGTCTGGGGACAGCCTCTTCCTGAGGAAAGCTGAGGATTTTGGAAATCGGCTAATGCCTGC 
CTTCAGAAC AC CAT C CAAGATTCCTTACTC GG ATGTGAACAT CGGTACTGGAGTTG CCCACC 
CGCCACGGTGGACCTCCGACAGCACTGTGGCCGAGGTGACCAGC ATTCAGCTGGAGTT CCGG 
GAGCTCTC CCGTCTCACAGGGG AT AAGAAGTTT CAG GAGG CAGTGGAG AAGGTGACACAG CA 
CATCCACGGCCTGTCTGGGAAGAAGGATGGGCTGGTGCCCATGTTCATCAATACCCACAGTG 
GCCTCTT CAC C CAC C TGGGCGTATTCACG CTGGG CG CCAG GG C CGACAGCTACTATGAGTAC 

CTGCTGAAGCAGTGGATCCAGGGCGGGAAGCAGGAGACACAGCTGCTGGAAGACTACGTGGA 
AGCCATCGAGGGTGTCAGAACGCACCTGCTGCGGCACTCCGAGCCCAGTAAGCTCACCTTTG 
TGGGGGAGCTTGCCCACGGCCGCTTCAGTGCCAAGATGGACCACCTGGTGTGCTTCCTGCCA 
GGGACGCTGGCTCTGGGCGTCTACCACGGCCTGCCCGCCAGCCACATGGAGCTGGCCCAGGA 
GCTCATGGAGACTTGTTACCAGATGAACCGGCAGATGGAGACGGGGCTGAGTCCCGAGATCG 
TGCACTTCAACCTTTACCCCCAGCCGGGCCGTCGGGACGTGGAGGTCAAGCCAGCAGACAGG 
CAC AAC CTGC TGCGGC CAGAGAC CGTGGAGAGCCTGTTCTACCTGT ACCG CGTCAC AGGGGA 
CCGCAAATAC CAGGACTGGGGCTGGGAGATT CTGCAGAGCTT CAGC CGATTC ACACGGGTC C 
CCTCGGGTGGCTATTCTTCCATCAACAATGTCCAGGATCCTCAGAAGCCCGAGCCTAGGGAC 
AAGATGGAGAGCTTCTTCCTGGGGGAGACGCTCAAGTATCTGTTCTTGCTCTTCTCCGATGA 
CCCAAACCTGCTCAGCCTGGACGCCTACGTGTTCAACACCGAAGCCGACCCTCTGCCTATCT 
GGACCCCTGCCTAGGGTGGATGGCTGCTGGTGTGGGGACTTCGGGTGGGCAGAGGCACCTTG 
CTGGGTCTGTGGC^TTTTCCAAGGGCCCACGTAGCACCGGC^ACCGCCAAGTGGCCCAGGCT 
CTGAACTGGCTCTGGGCTCCTCCTCGTCTCTGCTTTAATCAGGACACCGTGAGGACAAGTGA 
GGCCGTCAGTCTTGGTGTGATGCGGGGTGGGCTGGGCCGCTGGAGCCTCCGCCTGCTTCCTC 
CAGAAGACACGAATCATGACTCACGATTGCTGAAGCCTGAGCAGGTCTCTGTGGGCCGACCA 
GAGGGGGGCTTCGAGGTGGTCCCTGGTACTGGGGTGACCGAGTGGACAGCCCAGGGTGCAGC 
TCTGCCCGGGCTCGTGAAGCCTCAGATGTCCCCAATCCAAGGGTCTGGAGGGGCTGCCGTGA 
CTCCAGAGGCCTGAGGCTCCAGGGCTGGCTCTGGTGTTTACAAGCTGGACTCAGGGATCCTC 
CTGGCCGCCCCGCAGGGGGCTTGGAGGGCTGGACGGCAAGTCCGTCTAGCTCACGGGCCCCT 
CCAGTGGAATGGGTCTTTTCGGTGGAGATAAAAGTTGATTTGCTCTAACCGCAA 
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FIGURE 10 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA5652 9 
<subunit 1 of 1, 699 aa, 1 stop 
<MW: 79553, pI: 7.83, NX(S/T): 0 

MAACEGRRSGALGSSQSDFLTPPVGGAPWAVATTVVMYPPPPPPPHRDFISVTLSFGESYDN 
SKSWRRRSCWRKWKQLSRLQRNMILFUIiAFLLFCGLLFYINIjADHW 

IAGLKPANPPVLPAPQKADTDPENLPEISSQKTQRHIQRGPPHLQIRPPSQDLKDGTQEEAT 
KRQEAPVDPRPEGDPQRTVISWRGAVIEPEQGTELPSRRAEVPTKPPLPPARTQGTPVHLNY 
RQKGVIDVFLHAWKGYRKFAWGHDELKPVSRSFSEWFGLGLTLIDALDTMWILGLRKEFEEA 
RKWSKKLHFEKDVDVNLFESTIRILGGLLSAYHLSGDSLFLRKAEDFGNRLMPAFRTPSKI 
PYSDVNIGTGVAHPPRWTSDSTVAEVTSIQLEFRELSRLTGDKKFQEAVEKVTQHIHGLSGK 
KDGLVPMF INTHSGLFTHLGVFTLGARADS YYEYLLKQWI QGGKQETQLLEDYVEAIEGVRT 
HLLRHS E P SKLTFVGE LAHGR F S AKMDHL VCFL P GTLALGVYHGL PASHM E LAQ ELMET CYQ 
MNRQMETGLSPEIVHFNLYPQPGRRDVEVKPADRHNIJ.RPETVESLFYLYRVTGDRKYQDWG 
WEILQSFSRFTRVPSGGYSSINNVQDPQKPEPRDKMESFFLGETLKYLFLLFSDDPNLLSLD 
AYVFNTEAHPLPIWTPA 

Important features of the protein: 
Transmembrane domain: 

amino acids 21-40 and 84-105 (type II) 
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FIGURE 11 

GGCGCCGCGTAGGCCCGGGAGGCCGGGCCGGCCGGGCTGCGAGCGCCTGCCCCATGCGCCGC 
CGCCTCTCCGCACGATGTTCCCCTCGCGGAGGAAAGCGGCGCAGCTGCCCTGGGAGGACGGC 
AGGTCCGGGTTGCTCTCCGGCGGCCTCCCTCGGAAGTGTTCCGTCTTCCACCTGTTCGTGGC 
CTGCCTCTCGCTGGGCTTCTTCTCCCTACTCTGGCTGCAGCTCAGCTGCTCTGGGGACGTGG 
CCCGGGCAGTCAGGGGACAAGGGCAGGAGACCTCGGGCCCTCCCCGTGCCTGCCCCCCAGAG 
CCGCCCCCTGAGCACTGGGAAGAAGACGCATCCTGGGGCCCCCACCGCCTGGCAGTGCTGGT 
GCCCTTCCGCGAACGCTTCGAGGAGCTCCTGGTCTTCGTGCCCCACATGCGCCGCTTCCTGA 
GCAGGAAGAAGATCCGGCACCACATCTACGTGCTCAACCAGGTGGACCACTTCAGGTTCAAC 
CGGGCAGCG CTC AT CAAC GTGG G C TT CCTGGAGAGCAGCAACAGCACGG ACT ACATTG CCAT 
GCACGACGTTGACCTGCTCCCTCTCAACGAGGAGCTGGACTATGGCTTTCCTGAGGCTGGGC 
CCTTCCACGTGGCCTCCCCGGAGCTCCACCCTCTCTACCACTACAAGACCTATGTCGGCGGC 
ATCCTGCTGCTCTCCAAGCAGCACTACCGGCTGTGCAATGGGATGTCCAACCGCTTCTGGGG 
CTGGGGCCGCGAGGACGACGAGTTCTACCGGCGCATTAAGGGAGCTGGGCTCCAGCTTTTCC 
GC CCCT CGGGAAT CACAACTGGGTACAAGACATTT C GCCACCTGCATG AC CC AG CCTGGC GG 
AAGAGGGAC CAGAAGCGC AT CG CAGCTCAAAAACAGGAGCAG TTCAAGGTGGACAGGGAGGG 
AGGCCTGAACACTGTGAAGTACCATGTGGCTTCCCGCACTGCCCTGTCTGTGGGCGGGGCCC 
CCTGCACTGTCCTCAACATCATGTTGGACTGTGACAAGACCGCCACACCCTGGTGCACATTC 
AG CTg&GCTGGATG GACAGT GA GG AAGC CTGT AC C T ACAGGC CAT ATTGCT CAGGCTCAGGA 
CAAGGCCTCAGGTCGTGGGCCCAGCTCTGACAGGATGTGGAGTGGCCAGGACCAAGACAGCA 
AG CTACGC AATT GCAGCCAC CCGGC CGC CAAGGCAGG C TTGGGCTGGGC CAGGACACGTGGG 

GTGCCTGGGACGCTGCTTGCCATGCACAGTGATCAGAGAGAGGCTGGGGTGTGTCCTGTCCG 
GGACCCCCCCTGCCTTCCTGCTCACCCTACTCTGACCTCCTTCACGTGCCCAGGCCTGTGGG 
TAGTGGGGAGGGCTGAACAGGAC^CCTCTCATCACCCrACrCTGACCTCCTTCACGTGCCC 
AGGCCTGTGGGTAGTGGGGAGGGCTGAACAGGACAACCTCTCATCACCCCCAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 12 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA56531 
<subunit 1 of 1, 327 aa, 1 stop 
<MW: 37406, pI: 9.30, NX(S/T): 1 

MFPSRRKAAQLPWEDGRSGLLSGGLPRKCSVFHLFVACLSLGFFSLLWLQLSCSGDVARAVR 

GQGQETSGPPRACPPEPPPEHWEEDASWGPHRLAVLWFRERFEELLVFVPHMRRFLSRKKI 

RHHIYVLNQVDHFRFNRAALINVGFLESSNSTDYIAMHDVDLLPLNEELJ3YGFPEAGPFHV 

SPELHPLYHYKTYVGGILLLSKQHYRLCNGMSNRFWGWGREDDEFYRRIKGAGLQLFRPSGI 

TTGYKT FRHLHD PAWRKRDQKR I AAQKQEQFKVDREGGLNTVKYHVAS RTALS VGGAP CTVL 

NIMLDCDKTATPWCTFS 

Signal peptide: 
amino acids 1-42 

Transmembrane domain: 

amino acids 29-49 (type II) 

N-glycosylation site. 

amino acids 154-158 

cAMP- and cGMP-dependent protein kinase phosphorylation site. 

amino acids 27-31 

Tyrosine kinase phosphorylation site. 

amino acids 226-233 

N-myristoylation site. 

amino acids 19-25, 65-71, 247-253, 285-291, 303-309, 304-310 
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FIGURE 13 

CAATGTTTGCCTATCCACCTCCCCCAAGCCCCTTTACCTATGCTGCTGCTAACGCTGCTGCT 
GCTGCTGCTGCTGCTTAAAGGCTCATGCTTGGAGTGGGGACTGGTCGGTGCCCAGAAAGTCT 
CTTCTGCCACTGACGCCCCCATCAGGGATTGGGCCTTCTTTCCCCCTTCCTTTCTGTGTCTC 
CTGCCTCATCGGCCTGCCATGACCTGCAGCCAAGCCCAGCCCCGTGGGGAAGGGGAGAAAGT 
GGGGGATGGCTAAGAAAGCTGGGAGATAGGGAACAGAAGAGGGTAGTGGGTGGGCTAGGGGG 
GCTGCCTTATTTAAAGTGGTTGTTTATGATTCTTATACTAATTTATACAAAGATATTAAGGC 
C C TGTT CATTAAGAAATTGTT CCCTT CC CCTGTGTT CAATGTTTG TAAAGATTG TT CT GTGT 
AAATATGTCTTTATAATAAACAGT TAAAAGCTG AAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 14 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA56862 
<subunit 1 of 1, 73 aa, 1 stop 
<MW: 7879, pI: 7.21, NX(S/T): 0 

MLLLTLLLLLLLLKGSCLEWGLVGAQKVSSATDAPIRDWAFFPPSFLCLLPHRPAMTCSQAQ 
PRGEGEKVGDG 



Important features: 
Signal peptide: 

amino acids 1-15 

Growth factor and cytokines receptors family: 

amino acids 3-18 
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FIGURE 15 

GGGACCCATGCGGCCGTGACCCCCGGCTCCCTAGAGGCCCAGCGCAGCCGCAGCGGACAAAG 
GAGCATGTCCGCGCCGGGGAAGGCCCGTCCTCCGGCCGCCATAAGGCTCCGGTCGCCGCTGG 
GCCCGCGCCGCGCTCCTGCCCGCCCGGGCTCCGGGGCGGCCCGCTAGGCCAGTGCGCCGCCG 
CTCGCCCCGCAGGCCCCGGCCCGCAGCATGGAGCCACCCGGACGCCGGCGGGGCCGCGCGCA 
GCCGCCGCTGTTGCTGCCGCTCTCGCTGTTAGCGCTGCTCGCGCTGCTGGGAGGCGGCGGCG 
GCGGCGGCGCCGCGGCGCTGCCCGCCGGCTGCAAGCACGATGGGCGGCCCCGAGGGGCTGGC 
AGGGCGGCGGGCGCCGCCGAGGGCAAGGTGGTGTGCAGCAGCCTGGAACTCGCGCAGGTCCT 
GCCCC CAGAT ACTC TG C C CAACCG CACGG T CA C C CTGATT CTGAGT AACAATAAGATATCCG 

AGCTGAAGAATGGCTCATTTTCTGGGTTAAGTCTCCTTGAAAGATTGGACCTCCGAAACAAT 
CTTATTAGTAGTATAGATCCAGGTGCCTTCTGGGGACTGTCATCTCTAAAAAGATTGGATCT 
GACAAACAAT CGAATAGG ATGTCTGAAT GCAG AC ATATTTCGAGGACT CAC CAATCTGGTTC 
GGCTAAACCTTTCGGGGAATTTGTTTTCTTCATTATCTCAAGGAACTTTTGATTATCTTGCG 
TCATTACGGTCTTTGGAATTCCAGACTGAGTATCTTTTGTGTGACTGTAACATACTGTGGAT 
GCATCGCTG GGT AAAGGAGAAG AACATCACGGTACG GGATACCAGGTGTG TTTAT CCT AAGT 
CACTGCAGGCCCAACCAGTCACAGGCGTGAAGCAGGAGCTGTTGACATGCGACCCTCCGCTT 
GAATTGCCGTCTTTCTACATGACTCCATCTCATCGCCAAGTTGTGTTTGAAGGAGACAGCCT 
T C CTTT CC AG TGCATGGCTTCATATATTGAT CAGGACATG CAAGTGTTGT GGTAT CAGGATG 

GGAGAATAGTTGAAACCGATGAATCGCAAGGTATTTTTGTTGAAAAGAACATGATTCACAAC 
TGCTCCTTGATTGCAAGTGCCCTAACCATTTCTAATATTCAGGCTGGATCTACTGGAAATTG 
GGGCTGTCATGTCCAGACCAAACGTGGGAATAATACGAGGACTGTGGATATTGTGGTATTAG 
AGAGTTCTGCACAGTACTGT C CT CCAGAGAGGGT GGTAAACAACAAAGGTGACTTC AGATGG 
CC CAGAACATTGG C AG GC ATTACTGCAT ATCTG CAG TGTACGCGGAACACCC ATG GCAGTGG 
GATAT ATCCCGGAAAC CCACAGGATGAGAG AAAAGCTTGG CGCAGATG TGATAGAGGTGGCT 
TTTGGGCAGATGATGATTATTCTCGCTGTCAGTATGCAAATGATGTCACTAGAGTTCTTTAT 
ATGT TTAATC AG ATGCCC CT CAATCTTA C CAATGCCGTGGCAACAGCT CGACAGTTA CTGGC 
TTA<^CTGTGGAAGCAGCCAACTTTTCTGACAAAATGGATGTTATATTTGTGGCAGAAATGA 
TT GAAAAATTTGGAAGAT TT AC CAAGGAGGAAAAATCAAAAGAGCTAGGTGACGTGATGGTT 
GACATTGCAAGTAACATCATGTTGGCTGATGAACGTGTCCTGTGGCTGGCGCAGAGGGAAGC 
TAAAGCCTGCAGTAGGATTGTGCAGTGTCITCAGCGCATTGCTACCTACCGGCTAGCCGGTG 
GAGCTCACGTTT AT TCAAC^T ATTCACCCAATATTG CTCTGGAAGCTT ATGT CATCAAGT CT 
AC TGGCTTCACGGG GATGAC CTGTACCGTGTTCCAGAAAGTGG C AGCCT CTGAT CGTACAGG 
AC TTTCGGATTATG GGAGGCGGGATCCAGAGGGAAACCTGGATAAG CAGCTGAGCTTT AAGT 
GCAATGTTTCAAATACATTTTCGAGTCTGGCACTAAAGGTATGTTACATTCTGCAATCATTT 
AAGACTATTTACAGT2^^TTAGAATGCTCCAAATGTTCTGCTTCGCAAAATAACCTTATTA 
AAAGATTTTTTTTTGCAGGAAGATAGGTATTATTGCTTTTGCTACTGTTTTAAAGAAAACTA 
AC CAGGAAGAA CTGCATTACGACTTTCAAGGG CCCTAGGCATTTTTGC CTTT GATT CC CTTT 

CTTCACATAAAAATATCAGAAATTACATTTTATAACTGCAGTGGTATAAATGCAAATATACT 
ATTGTTACATGTGAAAAAATTTTATTTGACTTAAAAGTTTATTTATTTGTTTTTTTGCTCCT 
GATTTTAAGACAATAAGATGTTTTCATGGGCCCCTAAAAGTATCATGAGCCTTTGGCACTGC 
GCCTGCC^GCCTAGTGGAGAAGTCAACCCTGAGACCAGGTGTTTAATCAAGCAAGCTGTAT 
AT CAAAATTTTTGGCAGAAAACACAAATATGT CATATATCTTTTTTTAAAAAAAGTATTT CA 
TTGAAG CAAGCAAAATGAAAGCATTTTT AC TGATTTTTAAAATTGGTGCTTTAGATATATTT 
GACTACACTGTATTGAAGCAAATAGAGGAGGCACAACTCCAGCACCCTAATGGAACCACATT 
TTTT TCAC TTAGCTTT CTGT GGGCATGTGT AATTGTATTCTCTGCGGTTT TTAATCTCACAG 
TACTTTATTTCTGTCTTGTCCCTC^WITAATATCACAAACAATATTCCAGTCATTTTAAT^ 

TGCATAATAACTGATCCAACAGGTGTTAGGTGTTCTGGTTTAGTGTGAGCACTCAATAAATA 
TTGAATGAATGAACGAAAAAAAAAAAAAAAA 
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FIGURE 16 

MEPPGRRRGRAQPPLLLPLSLIALLALLGGGGGGGAAALPAGCKHDGRPRGAGRAAGAAEGK 
WCSSLELAQVLPPDTLPNRTVTLILSNNKISELKNGSFSGLSLLERLDLRNNLISSIDPGA 
FWGLSSLKRLDLTNNR I GCLNAD I FRGLTNLVRLNLSGNLFS SL SQGTFD YLAS LRSLEFQT 
EYIJLCDCNILWMHRWVKEKNITVRDTRCVYPKSLQAQPVTGVKQELLTCDPPLELPSFYMTP 
SHRQWFEGDSLPFQCMASYIDQDMQVLWYQDGRIVETDESQGIFVEKNMIHNCSLIASALT 
ISNIQAGSTGNWGCHVQTKRGNNTRTVDIVVLESSAQYCPPERVVNNKGDFRWPRTLAGITA 
YLQCTRNTHGSGIYPGNPQDERKAWRRCDRGGFWADDDYSRCQYANDVTRVLYMFNQMPLNL 
TNAVATARQLLAYTVEAANF.SDKMDVI FVAEMI EKF'GRFTKEEKSKELGDVMVD IASNIMLA 
DERVLWLAQREAJCACSRIVQCLQRIATYRLAGGAHVYSTYSPNIALEAYVIKSTGFTGMTCT 
VFQKVAASDRTGLSDYGRRDPEGNLDKQLSFKCNVSNTFSSLALiCVCYILQSFK'IVlYS 

Signal peptide: 

amino acids 1-33 

Transmembrane domain: 

amino acids 13-40 (type II) 

N-glycosylation site. 

amino acids 81-85, 98-102, 159-163, 206-210, 301-305, 332-336, 
433-437, 453-457, 592-596 

N-myristoylation site. 

amino acids 29-35, 30-36, 31-37, 32-38, 33-39, 34-40, 51-57, 
57-63, 99-105, 123-129, 142-148, 162-168, 317-323, 320-326, 
384-390, 403-409, 554-560 
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FIGURE 17 

GCGTGGGGASGTCTAGGAGCTCGAAGGTGGTGCTGGGCCTCTCGGTGCTGCTGACGGCGGCC 
ACAGTGGCCGGGGTACATGTGAAGCAGCAGTGGGACCAGCAGAGGCTTCGTGACGGAGTTAT 
CAGAGACATTGAGAGGCAAATTCGGAAAAAAGAAAACATTCGTCTTTTGGGAGAACAGATTA 
TTTTGACTGAGCAACTTGAAGCAGAAAG AGAGAAGATGTTATTGGCAAAAGG AT CT CAAAAA 
TCATG^CTTGAATGTGAAATATCTGTTGGACAGACAACACGAGTTTGTGTGTGTGTGTTGAT 
GGAGAGTAGCTTAGTAGTATCTTCATCTTTTTTTTTGGTCACTGTCCTTTTAAACTTGATCA 
AATAAAGGACAGTGGGTCATATAAGTTACTGCTTTCAGGGTCCCTTATATCTGAATAAAGGA 
GTGTGGGCAGACACTTTTTGGAAGAGTCTGTCTGGGTGATCCTGGTAGAAGCCCCATTAGGG 
TCACTGTC CAGT GCTTAGGGTTGTTACT GAGAAG CACTG C CG AGCTTGTGAGAAGGAAGGGA 
TGGATAGT AG CATC CA C CTGAGTAGT CTGATCAG TCGG CATGATGACG AAG CCACGAGAA C A 
T GGACCT CAGAAGGACTGGAGGAAGGTGAAGTGGAGGGAG AGACGCTC CTGAT CGT CGAAT CC 
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FIGURE 18 

MSRSSKWLGLSVLLTAATVAGVHVKQQWDQQRLRDGVIRDIERQIRKKENIRLLGEQI 
EQLEAEREKMLLAKGSQKS 

Signal peptide: 

amino acids 1-21 
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FIGURE 19 

CTGTCGTCTTTGCTTCAGCCGCAGTCGCCACTGGGTGCCTGAGGTGCTCTTACAGCCTGTTC 

CAAGTGTGGCTTAATCCGTCTCCACCACCAGATCTTTCTCCGTGGATTCCTCTGCTAAGACC 

GCTGCCATGCCAGTGACGGTAACCCGCACCACCATCACAACCACCACGACGTCATCTTCGGG 

CCTGGGGTCCCCCATGATCGTGGGGTCCCCTCGGGCCCTGACACAGCCCCTGGGTCTCCTTCGC 

CTGCTGCAGCTGGTGTCTACCTGCGTGGCCTTCTCGCTGGTGGCTAGCGTGGGCGCCTGGAC 

GGGGTCCATGGGCAACTGGTCCATGTTCACCTGGTGCTTCTGCTTCTCCGTGACCCTGATCA 

TCCTCATCGTGGAGCTGTGCGGGCTCCAGGCCCGCTTCCCCCTGTCTTGGCGCAACTTCCCC 

ATCACCTTCGCCTGCTATGCGGCCCTCTTCTGCCTCTCGGCCTCCATCATCTACCCCACCAC 

CTATGTCCAGTTCCTGTCCCACGGCCGTTCGCGGGACCACGCCATCGCCGCCACCTTCTTCT 

CCTGCATCGCGTGTGTGGCTTACGCCACCGAAGTGGCCTGGACCCGGGCCCGGCCCGGCGAG 

ATCACTGGCTATATGGCCACCGTACCCGGGCTGCTGAAGGTGCTGGAGACCTTCGTTGCCTG 

CATCATCTTCGCGTTCATCAGCGACCCCAACCTGTACCAGCACCAGCCGGCCCTGGAGTCGT 

GCGTGGCGGTGTACGCCATCTGCTTCATCCTAGCGGCCATCGCCATCCTGCTGAACCTGGGG 

GAGTGCACCAACGTGCTACCCATCCCCTTCCCCAGCTTCCTGTCGGGGCTGGCCTTGCTGTC 

TGTCCTCCTCTATGCCACCGCCCTTGTTCTCTGGCCCCTCTACCAGTTCGATGAGAAGTATG 

GCGGCCAGCCTCGGCGCTCGAGAGATGTAAGCTGCAGCCGCAGCCATGCCTACTACGTGTGT 

GCCTGGGACCGCCGACTGGCTGTGGCCATCCTGACGGCCATCAACCTACTGGCGTATGTGGC 

TGACCTGGTGCACTCTGCCCACCTGGTTTTTGTCAAGGTCTMGACTCTCCCAAGAGGCTCC 

CGTTCCCTCTCCAACCTCTTTGTTCTTCTTGCCCGAGTTTTCTTTATGGAGTACTTCTTTCC 

TCCGCCTTTCCTCTGTTTTCCTCTTCCTGTCTCCCCTCCCTCCCACCTTTTTCTTTCCTTCC 

CAATTCCTTGCACTCTAACCAGTTCTTGGATGCATCTTCrrCCTTCCCTTTCCTCTTGCTGT 

TTCCTTCCTGTGTTGTTTTGTTGCCCACATCCTGTTTTCACCCCTGAGCTGTTTCTCTTTTT 

CTTTTCTTTCTTTTTTTTTTTTTTTTTTAAGACGGATTCTCACTCTGTGGCCCAGGCTGGAG 

TGCAGTGGTGCGATCTCAGCTCACTGCAACCCCCGCCTCCTGGGTTCAAGCGATTCTCCTCC 

CCCAGCCTCCCAAGTAGCTGGGAGGACAGGTGTGAGCTGCCGCACCCAGCCTGTTTCTCTTT 

TTCCACTCTTCTTTTTTCTCATCTCTTTTCTGGGTTGCCTGTCGGCTTTCTTATCTGCCTGT 

TTTGCAAGCACCTTCTCCTGTGTCCTTGGGAGCCCTGAGACTTCTTTCTCTCCTTGCCTCCA 

CCCACCTCCAAAGGTGCTGAGCTCACATCCACACCCCTTGCAGCCGTCCATGCCACAGCCCC 

CCAAGGGGCCCCATTGCCAAAGCATGCCTGCCCACCCTCGCTGTGCCTTAGTCAGTGTGTAC 

GTGTGTGTGTGTGTGTGTTTGGGGGGTGGGGGGTGGGTAGCTGGGGATTGGGCCCTCTTTCT 

CCCAGTGGAGGAAGGTGTGCAGTGTACTTCCCCTTTAAATTAAAAAACATATATATATATAT 

ATTTGGAGGTCAGTAATTTCCAATGGGCGGGAGGCATTAAGCACCGACCCTGGGTCCCTAGG 

CCCCGCCTGGCACTCAGCXTITGCCAGAGATTGGCTCC^GAATTTTTGCC^USGCTTACAGAACAC 

CCACTGCCTAGAGGCCATCTTAAAGGAAGCAGGGGCTGGATGCCTTTCATCCCAACTATTCT 
CTGTGGTATGAAAAAG 

/ 7/^7 6 
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FIGURE 20 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA58727 
<subunit 1 of 1, 322 aa, 1 stop 
<MW: 35274, pI: 8.57, NX(S/T): 1 

MPVTVTRTTITTTTTSSSGLGSPMIVGSPRALTQPLGLLRLLQLVSTCVAFSLVASVGAWTG 
SMGNWSMFTWCFCFSVTL I IL I VELCGLQARFPLSWRNFP ITFACYAALFCLSAS 1 1 YPTTY 
VQFLSHGRSRDHAIAATFFSCIACVAYATEVAWTRARPGEITGYMATVPGLLKVLETFVACT 
I FAF I S D PNL YQHQ PAL EWC VAVYAI CF I LAAI A I LLNLGE CTNVL PTPFPSFLS GLALLS V 

LLYATALVLWPLYQFDEKYGGQPRRSRDVSCSRSHAYYVCAWDI^LAVAILTAINLLAYVAD 
LVHSAHLVFVKV 

Important features: 
Transmembrane domains: 

amino acids 41-60 (type II), 66-85, 101-120, 137-153, 171-192, 
205-226, 235-255 and 294-312 

N-glycosylation site. 

amino acids 66-69 

Glycosaminoglycan attachment site. 

amino acids 18-21 
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FIGURE 21 



TOCC " GCTMm " GTAT ™ MTAGMACC ^TTTCACCA TC TTGGCCAGGCTGGTC 

^^ctatgcatttttaagaaattattctg™^^ 

gagagtgatttgt ta 

=AAAGAGCTAGCC7 GC CATC *GAATA 3 r rCAGAAGAGA rGGGQAQCACTACACTCA^TACACTTTGGCCTGAGAA 



AGGA ^~ TAC ^^^ tcgc ^ aaa ^ cct ^cgagg TC gtatttcagcccaaactS 

GAAAGAGCTAGCCAGCCATCAGAATAGTCCAGAAGAGATGGGGAGCACTACACTCACTAC^^ 

AATAGCATGGGAITGGAGGAGCCTGGGGGAACACCACTTCTGCCGACCTGGGCAG^GGCATTGAG^^ 
* A ^raCA< 3 TAG<^TAGAAA G GACA^ 

AACAGATATGGGCAAGCAAAGCC^GGGC^TTGAT^TAATCCTG^ 



TCTGAATCTCCATTGCTTTCTGGGAG<3ACATAATTCACCTGTCCTAGCTTCTTAr^A^^ 



AT^GCCCCTCCCAT^TTCTG^CACTTTOTCCTTTCTCCTCCCGTTTGC^ 
^^^ C ^ TCTCCCCTTTC "^™"CAGGTGAATCTCAGCCCmc^ C C^ 

™^ CCCTATCTCCAGGTAmCC «^^^^ 

T^CTCCTATTCAGACCTCAGCGAGGGCGAACAAGAGGCTCGmTGCAGCAGGAG^G^G 
TCGCGGAAGCCAAGCTCCGAGCATGGTCTTCGGTGGA' ^-AWAeTGOCTGAGCAGTTTGCCA 



AC ^^ CCGGCCTGTGCGC «^ TCCG ^CCTG^ 

^^^ TAGT ^ TC " GCCT ^^TGGGTTGTTGGGCTCCCC« 3 C<:CGGCTGGCCTCC^ 
^GGTGGTGTCCTTAGATGAGGATGAGGCAGAGCCAGAGGAACAGTGACCCACATCATGCCTGGCAGT^ 

tcccccggctgctgccaggggcagagcctctgtgcccaagtgtg^tcaaggo^ccagIaIm 
ggctg^cgcatgtcctgcccccactcccggggcttgccgggggttgcccg^ 

A ^ GG 2f^! GAG I GGGCT ^ 



ATTCACCTCTCCATCGTCTCTAAATCTTCCTCTTTTTTCCTAAAGACA^ 



^CTCATTAGGTGTTTATTTTGTTCTATTTAAGAATTTGTTTTATTA 
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FIGURE 22 

MF^TLSFr^PFAHPFGTVSCEYMLGSPLSSIAQVNLSPFSHPKVHMDPNYCHPSTSLHLCS 

IAWSFTRLLHPPLSPGISQVVKDHVTKPTAMAQGRVAHLIEWKGWSKPSDSPAALESAFSSY 

SDLSEGEQEARFAAGVAEQFAIAEAKIilAWSSVDGEDSTDDSYDEDFAGGMDTDMAGQLPLG 

PHLQDLFTGHRFSRPVRQGSVEPESDCSQTVSPDTLCSSLCSLEDGLLGSPARLASQLLGDE 

LLLAKLPPSRESAFRSLGPLEAQDSLYNSPLTESCLSPAEEEPAPCKDCQPLCPPLTGSWER 
QRQAS DLAS S GWS LDEDEAE PEEQ 

Signal peptide: 

amino acids 1-15 

Casein kinase II phosphorylation site. 

amino acids 123-127, 128-132, 155-159, 162-166, 166-170, 228-232, 
285-289, 324-328 

Tyrosine kinase phosphorylation site. 

amino acids 44-52 

N-myristoylation site. 

amino acids 17-23, 26-32, 173-179 

Prokaryotic membrane lipoprotein lipid attachment site. 

amino acids 11-22 
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FIGURE 23 

GGTTCCTGGGCGCTCTGTTACACAAGCAAGATACAGCCAGCCCCACCTAATTTTGTTTCCCT 

GGCACCCTCCTGCTCAGTGCGACATTGTCACACTTAACCCATCTGTTTTCTCTAATGCACGA 

CAGATTCCTTTCAGACAGGACAACTGTGATATTTCAGTTCCTGATTGTAAATACCTCCTAAG 

CCTGAAGCTTCTGTTACTAGCCATTGTGAGCTTCAGTTTCTTCATCTGCAAAATGGGCATAA 

TACAATCTATTCTTGCCACATCAAGGGATTGTTATTCCTTTAAAAAAAAACCAATACCAAAG 

AAGCCTACAATGTTGGCCTTAGCCAAAATTCTGTTGATTTCAACGTTGTTTTATTCACTTCT 

ATCGGGGAGCCTVTGGAAAAGAAAATCAAGACATAAACAC^ACACAGAACATTGCAGAAGTTT 

TTAAAACAATGGAAAATAAACCTATTTGTTTGGAAAGTGAAGCAAACTTAAACTCAGATAAA 

GAAAATATAACCACCrCAAATCTCAAGGCGAGTCATTCCCCTCCTTTGAATCTACCCAACAA 

CAGCCACGGAATAACAGATTTCTCCAGTAACTCATCAGCAGAGCATTCTTTGGGCAGTCTAA 

AACCCACATCTACCATTTCCACAAGCCCTCCCTTGATCCATAGCTTTGTTTCTAAAGTGCCT 

TGGAATGCACCTATAGCAGATGAAGATCTTTTGCCCATCTCAGCACATCCCAATGCTACACC 

TGCTCTGTCTTCAGAAAACTTCACTTGGTCTTTGGTCAATGACACCGTGAAAACTCCTGATA 

ACAGTTCCATTACAGTTAGCATCCTCTCTTCAGAACCAACTTCTCCATCTGTGACCCCCTTG 

ATAGTGGAACCAAGTGGATGGCTTACCACAAACAGTGATAGCTTCACTGGGTTTACCCCTTA 

TCAAGAAAAAACAACTCTACAGCCTACC1TAAAATTCACCAATAATTCAAAACTCTTTCCAA 

ATACGTCAGATCCCCAAAAAGAAAATAGAAATACAGGAATAGTATTCGGGGCCATTTTAGGT 

GCTATTCTGGGTGTCTCATTGCTTACTCTTGTGGGCTACTTGTTGTGTGGAAAAAGGAAAAC 

GGATTCATTTTCCCATCGGCGACTTTATGACGACAGAAATGAACCAGTTCTGCGATTAGACA 

ATGCACCGGAACCTTATGATGTGAGTTTTGGGAATTCTAGCTACTACAATCCAACTTTGAAT 

GATTCAGCCATGCCAGAAAGTGAAGAAAATGCACGTGATGGCATTCCTATGGATGACATACC 

TCCACTTCGTACTTCTGTA2&SAACTAACAGCAAAAAGGCGTTAAACAGCAAGTGTCATCTA 

CATCCTAGCCTTTTGACAAATTCATCTTTCAAAAGGTTACACAAAATTACTGTCACGTGGAT 

TTTGTCAAGGAGAATCATAAAAGCAGGAGACCAGTAGCAGAAATGTAGACAGGATGTATCAT 

CCAAAGGTTTTCTTTCTTACAATTTTTGGCCATCCTGAGGCATTTACTAAGTAGCCTTAATT 

TGTATTTTAGTAGTATTTTCTTAGTAGAAAATATTTGTGGAATCAGATAAAACTAAAAGATT 

TCACCATTACAGCCCTGCCTCATAACTAAATAATAAAAATTATTCCACCAAAAAATTCTAAA 

ACAATGAAGATGACTCTTTACTGCTCTGCCTGAAGCCCTAGTACCATAATTCAAGATTGCAT 

TTTCTTAAATGAAAATTGAAAGGGTGCTTTTTAAAGAAAATTTGACTTAAAGCTAAAAAGAG 

GACATAGCCCAGAGTTTCTGTTATTGGGAAATTGAGGCAATAGAAATGACAGACCTGTATTC 

TAGTACGTTATAATTTTCTAGATCAGCACACACATGATCAGCCCACTGAGTTATGAAGCTGA 

CAATGACTGCATTCAACGGGGCCATGGCAGGAAAGCTGACCCTACCCAGGAAAGTAATAGCT 

TCTTTAAAAGTCTTCAAAGGTTTTGGGAATTTTAACTTGTCTTAATATATCTTAGGCTTCAA 

TTATTTGGGTGCCTTAAAAACTCAATGAGAATCATGGT 
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FIGURE 24 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA58732 
<subunit 1 of 1, 334 aa, 1 stop 
<MW: 36294, pI: 4.98, NX(S/T): 13 

MIALAKILLI STLF YSLLSGSHGKENQD INTTQNI AEVFKTMENKP ISLESEANLNSDKENI 
TTSNLKASHSPPLNLPNNSHGITDFSSNSSAEHSLGSLKPTSTISTSPPLIHSFVSBCV^W^ 
PIADEDLLPISAHPNATPALSSENFTWSLVNDTVKTPDNSSITVSILSSEPTSPSVTPLIVE 
PSGWLTTNSDSFTGFTPYQEKTTLQPTLKFTNNSKLFPNTSDPQKENRNTGIVFGAILGAIL 

GVSLLTLVGYLLCGKRKTDSFSHRRLYDDRNEPVLRLDNAPEPYDVSFGNSSYYNPTL^ 
MPESEENARDGI PMDDI PPLRTSV 

Signal peptide: 
amino acids 1-23 

Transmembrane domain: 

amino acids 235-262 

N-glycosylation site. 

amino acids 30-34, 61-65, 79-83, 90-94, 148-152, 155-159, 
163-167, 218-222, 225-229, 298-302, 307-311 
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FIGURE 25 

AACAGGATCTCCTCTTGCAGTCTGCAGCCCAGGACGCTGATTCCAGCAGCGCCTTACCGCGC 

AGCCCGAAGATTCACTA2SGTGAAAATCGCCTTCAATACCCCTACCGCCGTGCAAAAGGAGG 

AGGCGCGGCAAGACGTGGAGGCCCTCCTGAGCCGCACGGTCAGAACTCAGATACTGACCGGC 

AAGGAGCTCCGAGTTGCCACCCAGGAAAAAGAGGGCTCCTCTGGGAGATGTATGCTTACTCT 

CTTAGGCCTTTCATTCATCTTGGCAGGACTTATTGTTGGTGGAGCCTGCATTTACAAGTACT 

TCATGCCCAAGAGCACCATTTACCGTGGAGAGATGTGCTTTTTTGATrCTGAGGATCCTGCA 

AATTCCCTTCGTGGAGGAGAGCCTAACTTCCTGCCTGTGACTGAGGAGGCTGACATTCGTGA 

GGATGACAACATTGCAATCATTGATGTGCCTGTCCCCAGTTTCTCTGATAGTGACCCTGCAG 

CAATTATTCATGACTTTGAAAAGGGAATGACTGCTTACCTGGACTTGTTGCTGGGGAACTGC 

TATCTGATGCCCCTCAATACTTCTATTGTTATGCCTCCAAAAAATCTGGTAGAGCTCTTTGG 

CAAACTGGCGAGTGGCAGATATCTGCCTCAAACTTATGTGGTTCGAGAAGACCTAGTTGCTG 

TGGAGGAAATTCGTGATGTTAGTAACCTTGGCATCTTTATTTACCAACTTTGCAATAACAGA 

AAGTCCTTCCGCCTTCGTCGCAGAGACCTCTTGCTGGGTTTCAACAAACGTGCCATTGATAA 

ATGCTGGAAGATTAGACACTTCCCCAACGAATTTATTGTTGAGACCAAGATCTGTCAAGAGT 

AAGAGGCAACAGATAGAGTGTCCTTGGTAATAAGAAGTCAGAGATTTACAATATGACTTTAA 

CATTAAGGTTTATGGGATACTCAAGATATTTACTCATGCATTTACTCTATTGCTTATGCTTT 

AAAAAAAGGAAAAAAAAAAAAACTACTAACCACTGCAAGCTCTTGTCAAATTTTAGTTTAAT 

TGGCATTGCTTGTTTTTTGAAACTGAAATTACATGAGTTTCATTTTTTCTTTGCATTTATAG 

GGTTTAGATTTCTGAAAGCAGCATGAATATATCACCTAACATCCTGACAATAAATTCCATCC 

GTTGTTTTTTTTGTTTGTTTGTTTTTTCTTTTCCTTTAAGTAAGCTCTTTATTCATCTTATG 

GTGGAGCAATTTTAAAATTTGAAATATTTTAAATTGTTTTTGAACTTTTTGTGTAAAATATA 

TCAGATCTCAACATTGTTGGTTTCTTTTGTTTTTCATTTTGTACAACTTTCTTGAATTTAGA 

AATTACATCTTTGCAGTTCTGTTAGGTGCTCTGTAATTAACCTGACTTATATGTGAACAATT 

TTCATGAGACAGTCATTTTTAACTAATGCAGTGATTCTTTCTCACTACTATCTGTATTGTGG 

AATGCACAAAATTGTGTAGGTGCTGAATGCTGTAAGGAGTTTAGGTTGTATGAATTCTACAA 

CCCTATAATAAATTTTACTCTATACAAAAAAAAAAAAAAAAAAA 
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FIGURE 26 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA58828 
<subunit 1 of 1, 263 aa, 1 stop 

<MW: 29741, pI: 5.74, NX(S/T): 1 

MVKIAFNTPTAVQKEEARQDVEALLSRTVRTQILTGKELRVATQEKEGSSGRCMLTLLGLSF 

ILAGLIVGGACIYKYFMPKSTIYRGEMCFFDSEDPANSLRGGEPNFLPVTEEADIREDDNIA 

IIDVPVPSFSDSDPAAIIHDFEKGMTAYLDLLLGNCYLMPLNTSIVMPPKNLVELFGKLASG 

RYLPQTYWREDLVAVEEIRDVSNLGIFIYQLCNNRKSFRLRRRDLLLGFNKRAIDKCWKIR 
KFPNEF I VETKI CQE 

Type II transmembrane domain: 

amino acids 53-75 

N-glycosylation site. 

amino acids 166-170 

Casein kinase II phosphorylation site. 

amino acids 35-39, 132-136, 134-138 

N-myristoylation site. 

amino acids 66-72, 103-109 

Prokaryotic membrane lipoprotein lipid attachment site. 

amino acids 63-74 



WO 00/12708 



PCT/US99/20111 



FIGURE 27 

GGAGGAGGGAGGGCGGGCAGGCGC CAGCCCAGAGCAGC CCCGGGCAC CAGCACGGACTCTCT 
CTTCCAGCCCAGGTGCCCCCCACTCTCGCTCCATTCGGCGGGAGCACCCAGTCCTGTACGCC 
AAGGAACTGGTCCTGGGGGCACCA2GGTTTCGGCGGCAGCCCCCAGCCTCCTCATCCTTCTG 
TTGCTGCTGCTGGGGTCTGTGCCTGCTACCGACGCCCGCTCTGTGCCCCTGAAGGCCACGTT 
CCTGGAGGATGTGGCGGGTAGTGGGGAGGCCGAGGGCTCGTCGGCCTCCTCCCCGAGCCTCC 
CGCCACCCTGGACCCCGGCCCTCAGCCCCACATCGATGGGGCCCCAGCCCACAACCCTGGGG 
GGCCCATCACCCCCCACCAACTTCCTGGATGGGATAGTGGACTTCTTCCGCCAGTACGTGAT 
GCTGATTGCTGTGGTGGGCTCCCTGGCCTTTCTGCTGATGTTCATCGTCTGTGCCGCGGTCA 
TCACCCGGCAGAAGCAGAAGGCCTCGGCCTATTACCCATCGTCCTTCCCCAAGAAGAAGTAC 
GTGGACCAGAGTGACCGGGCCGGGGGCCCCCGGGCCTTCAGTGAGGTCCCCGACAGAGCCCC 
CGACAGCAGGCCCGAGGAAGCCCTGGATTCCTCCCGGCAGCTCCAGGCCGACATCTTGGCCG 
CCACCCAGAACCTCAAGTCCCCCACCAGGGCTGCACTGGGCGGTGGGGACGGAGCCAGGATG 
GTGGAGGGCAGGGGCGCAGAGGAAGAGGAGAAGG GC AG C CAGGAGGGGGACC AGGAAGT CCA 
GGGACATGGGGT CCCAGTGGAGACACCAGAGGCG CAGG AGGAGC CGTG CT CAGGGGT CCTTG 
AGGGGGCTGTGGTGGCCGGTGAGGGCCAAGGGGAGCTGGAAGGGTCTCTCTTGTTAGCCCAG 
GAAGCC CAGGGACCAG TGGGT CC C C C CGAAAG C CC CTGTGCTTGCAGC AGTGTCC AC CC CAG 

TGTOTAACAGTCCTCCCGGGCTGCCAGCCCTGACTGTCGGGCCCCCAAGTGGTCACCTCCCC 

GTGTATGAAAAGGCCTTCAGCCCTGACTGCTTCCTGACACTCCCTCCTTGGCCTCCCTGTGG 

TGCCAATCCCAGCATGTGCTGATTCTACAGCAGGCAGAAATGCrGGTCCC^^ 

GGAATCTTACCAAGTGCCATCATCCTTCACCTCAGCAGCCCCAAAGGGCT 

ACAGCTCCCCTGACAAAGTGAGGGAGGGCACGTGTCCCTGTGACAGCCAGGATAAAACATCC 

CCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTGCCCGGCCCAAACTACTTTTTAAAACA 

GCTACAGGGTAAAATCCTGCAGCACCCACTCTGGAAAATACTGCTCTTAATTTTCCTGAAGG 

TGG C C C C CTGTTTCTAGTTGGTCCAGGATTAGGG ATGTGGGGTATAGGG CATTT AAAT CCTC 

TCAAGCGCTCTCCAAGCACCCCCGGCCTGGGGGTGAGTTTCTCATCCCGCTACTGCTGCTGG 

GATCAGGTTGAATGAATGGAACTCTTCCTGTCTGGC CT CCAAAGCAGCCTAGAAGCTGAGGG 

GCTGTGTTTGAGGGGACCTCCACCCTGGGGAAGTCCGAGGGGCTGGGGAAGGGTTTCTGACG 

CCCAGCCTGGAGCAGGGGGGCCCTGGCCACCCCCTGTTGCTCACACATTGTCTGGCAGCCTG 

TGTCCACAATATTCGTCAGTCCTCGACAGGGAGCCTGGGCTCCGTCCTGCTTTAGGGAGGCT 

CTOTCAG^AGGTCCTCTCCCCCATCCCTCCATCT 

CCAGGTGCTGAGATATAATGC^CCAGCACAATAAACCTTTATTCCGGCCTGAAAAAAAAAM 
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA^^ 
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FIGURE 28 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA58852 
<subunit 1 of 1, 283 aa, 1 stop 
<MW: 29191, pI: 4.52, NX(S/T): 0 

MVSAAAPSIilLLLLLLGSVPATDARSVPLKATFLEDVAGSGEAEGSSASSPSLPPPWTPAL 
SPTSMGPQPTTLGGPSPPTNFLCGIVDFFRQYVMLIAWGSLAFLLMFIVCAAVITRQKQKA 
SAYYPSSFPKKKYVDQSDRAGGPRAFSEVPDRAPDSRPEEALDSSRQLQADILAATQNLKSP 
TRAALGGGDGARMVEGRGAEEEEKGSQEGDQEVQGHGVPVETPEAQEEPCSGVLEGAWAGE 
GQGELEGSLLIiAQEAQGPVGPPESPCACSSVHPSV 

Signal peptide: 

amino acids 1-25 

Transmembrane domain: 

amino acids 94-118 

N-myristoylation site. 

amino acids 18-24, 40-46, 46-52, 145-151, 192-198, 193-199, 
211-217, 238-244, 242-248 
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FIGURE 29 

GTGGACTCTGAGAAGCCCAGGCAGTTGAGGACAGGAGAGAGAAGGCTGCAGACCCAGAGGGA 

GGGAGGACAGGGAGTCGGAAGGAGGAGGACAGAGGAGGGCACAGAGACGCAGAGCAAGGGCG 

GCAAGGAGGAGACCCTGGTGGGAGGAAGACACTCTGGAGAGAGAGGGGGCTGGGCAGAGATG 

AAGTTCCAGGGGCCCCTGGCCTGCCTCCTGCTGGCCCTCTGCCTGGGCAGTGGGGAGGCTGG 

CCCCCTGCAGAGCGGAGAGGAAAGCACTGGGACAAATATTGGGGAGGCCCTTGGACATGGCC 

TGGGAGACGCCCTGAGCGAAGGGGTGGGAAAGGCCATTGGCAAAGAGGCCGGAGGGGCAGCT 

GGCTCTAAAGTCAGTGAGGCCCTTGGCCAAGGGACCAGAGAAGCAGTTGGCACTGGAGTCAG 

GCAGGTTCCAGGCTTTGGCGCAGCAGATGCTTTGGGCAACAGGGTCGGGGAAGCAGCCCATG 

CTCTGGGAAACACTGGGCACGAGATTGGCAGACAGGCAGAAGATGTCATTCGACACGGAGCA 

GATGCTGTCCGCGGCTCCTGGCAGGGGGTGCCTGGCCACAGTCGTGCTTGGGAAACTTCTGG 

AGGCCATGGCATCTTTGGCTCTCAAGGTGGCCTTGGAGGCCAGGGCCAGGGCAATCCTGGAG 

GTCTGGGGACTCCGTGGGTCCACGGATACCCCGGAAACTCAGCAGGCAGCTTTGGAATGAAT 

CCTCAGGGAGCTCCCTGGGGTCAAGGAGGCAATGGAGGGCCACCAAACTTTGGGACCAACAC 

TCAGGGAGCTGTGGCCCAGCOTGGCTATGGTTCAGTGAGAGCCAGCAACCAGAATGAAGGGT 

GCACGAATCCCCCACCATGTGGCT CAGGTGGAGG CTCCAGCAACTCTGGGGGAGGCAGCGGC 

TCACAGTCGGGCAGCAGTGGCAGTGGCAGCAATGGTGACAACAACAATGGCAGCAGCAGTGG 
TGGCAGCAGCAGTGGCAGCAGCAGTGGCAGCAGCAGTGGCGGCAGCAGTGGCGGCAGCAGTG 
GTGGCAGCAGTGGCAACAGTGGTGGCAGCAGAGGTGACAGCGGCAGTGAGTCCTCCTGGGGA 
TCCAGCACCGGCTCCTCCTCCGGCAACCACGGTGGGAGCGGCGGAGGAAATGGACATAAACC 
CGGGTGTGAAAAGCCAGGGAATGAAGCCCGCGGGAGCGGGGAATCTGGGATTCAGGGCTTCA 
GAGGACAGGGAGTTTCCAGCAACATGAGGGAAATAAGCAAAGAGGGCAATCGCCTCCTTGGA 
GGCTCTGGAGACAATTATCGGGGGCAAGGGTCGAGCTGGGGCAGTGGAGGAGGTGACGCTGT 
TGGTGGAGTCAATACTGTGAACTCTGAGACGTCTCCTGGGATGTTTAACTTTGACACTTTCT 
GGAAGAATTTTAAATCCAAGCTGGGTTTCATCAACTGGGATGCCATAAACAAGGACCAGAGA 
AGCTCTCGCATCCCGTGACCTCCAGACAAGGAGCCACCAGATTGGATGGGAGCCCCCACACT 
CCCTCCTTAAAACACCACCCTCTCATCACTAATCTCAGCCCTTGCCCTTGAAATAAACCTTA 
GCTGCCCCACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 30 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA59212 
<subunit 1 of 1, 440 aa, 1 stop 
<MW: 42208, pI: 6.36, NX(S/T): 1 

MKFQGPLACLIJ^CLGSGEAGPLQSGEESTGTNIGEALGHGLGDALSEGVGKAIGKEAGGA 
AGSKVSEALGQGTREAVGTG VRQVPGFGAADALGNRVGEAAHALGNTGHE I GRQAEDVI RHG 
ADAVRGSWQGVPGHSGAWETSGGHGIFGSQGGLGGQGQGNPGGLGTPWVHGYPGNSAGSFC^I 
NPQGAPWGQGGNGGPPNFGTNTQGAVAQPGYGSVRASNQNEGCTNPP.PSGSGGGSSNSGGGS 
GSQSGSSGSGSNGDNNNGSSSGGSSSGSSSGSSSGGSSGGSSGGSSGNSGGSRGDSGSESSW 
GSSTGSSSGNHGGSGGGNGHKPGCEKPGNEARGSGESGIQGFRGQGVSSNMREISKEGNRLL 
GGSGDNYRGQGS SWGS GGGDAVGGVNTVNS ETS PGMFNFDTFWKNFKS KLGF I NWD AINKDQ 
RSSRIP 

Signal peptide: 

amino acids 1-21 



N-glycosylation site. 

amino acids 265-269 

Glycosaminoglycan attachment site. 

amino acids 235-239, 237-241, 244-248, 255-259, 324-328, 388-392 
Casein kinase II phosphorylation site. 

amino acids 26-30, 109-113, 259-263, 300-304, 304-308 
N-myristoylation site. 

amino acids 17-23, 32-38, 42-48, 50-56, 60-66, 61-67, 64-70, 

74-80, 90-96, 96-102, 130-136, 140-146, 149-155, 152-158, 

155-161, 159-165, 163-169, 178-184, 190-196, 194-200, 199-205, 

218-224, 236-242, 238-244, 239-245, 240-246, 245-251, 246-252, 

249-252, 253-259, 256-262, 266-272, 270-276, 271-277, 275-281, 

279-285, 283-289, 284-290, 287-293, 288-294, 291-297, 292-298, 

295-301, 298-304, 305-311, 311-317, 315-321, 319-325, 322-328, 

323-329, 325-331, 343-349, 354-360, 356-362, 374-380, 381-387, 
383-389, 387-393, 389-395, 395-401 

Cell attachment sequence. 

amino acids 301-304 
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FIGURE 31 

GA ^°^ CCCTCCGGTC ^ GATGTC ^ 

TG^CTGGCTGGTGGAGTTTCTCTCCTTTGCTGACCATGTTGTTCCCTTGCTGGAATATTACCGGGACATCTTCA 
CTCTCCTGCTGCGCCTGCACCGGAGCTTGGTGTTCTCGCAGGAGAGT6AGGGGAAGATGTGTTTCCTGAACAAGC 

G ^ G ? GGCTC " GGCAC ^ CGCCaGGCC ""TCCACAACCAGCCGCCCTCCTTGCGCCGGACCGTA^ 

^CGTG^GRMGAATTQ5ATCJUlACr6TCTCMACATATQAG6CTRCAC^ 

^ G ^ OTCTCCAAGAG ^^ TC *^^ 

^ctctccgggcgctgcttccagaggagacccckcagccxttct^cagtccagagaacattotgtgggIc 

TTGCAACAGAGAAAGCCTGTGCTTGGCTGTCAGCCAAGATCACAGCACTGATCAGGAGGGAGGTGAAAGCAGCM 

G ^^ CT ^ CMTGGGGCmCGGQACCCTG ^^ 
"^ G J^ CGCTCCGGTGCCGC ^^™ G =^ 



G ^ GGmCTO ^ TGCTCCmCOTG:K ^SGAAGACTTTa 
CTGCTG^GCCCAAGAAATGTGGGGCTTCTGGCAGACACAAGGCCAAGGGAGTGGGACTTGCTGCTATTCTTC 
CGGGAGCTGGTGGAGAAGGGTCTGATGGGACGGATGGAGATAGAGGCCTGCCTGGGCAGCCTCCACCA 
TGGCCAGGGGACTTTGCTGJUGAATTAGCAACACT3TCTAATCTGTTTCT 
C^^GCCTGTGAGTiraTGCAGCCAAACCGTC^ 

^ GC J^ CAOTG ^ CCAGAACCC ^ 
T^GGGTGTAGCTGGGTCTACAGTCAGACTTCra^ 

ATCCTAGAGGAAGGAGAGTTGGCCTGATTTGGGATTATGGCAGAAAAGTCCAGAGATGCCAGTCCTGGAGTAGAA 
^GCTATCCCACXTATCrCTTAAAACTTTGTAGTCTTCKAA^ 

TTATtaAAGAAAGTTAAAACATGAATCTTGGGAGTCTACATTTTCTTATCACCAGGAGCTGGACTGCCATCTCCTT 
ATAAATGCCTAACACAGGCCGGGTCTGGTGGCTCATGCCTGTAATCCCAGCACTTTGAGAGGCCTGAGGTCGGCG 
GACrGCCTGAGGTCAGGAATTCAAGACCAGCCTGGCCAACATGGCAAAACCCCATCTCTACTAAAAATAAAAAAA 
™" AGCTG ^^ GGTCTOTCC ™ TM TCCCAGCTACTCAGGAGGaTGAG^ 

CTGGAGGTGGAGGTTGCAGTGAGCCGAGGTCGCACCACTGCACTCCAGTCTGGGTAACAGAGCGAGACTTTCTAG 
AAAAAGCCTAACAAACAGATAAGGTAGGACTCAACCAACTGAAACCTGACTTTCCCCCTGTACCTTCAGCCCCTC 

CTGGTTTTCTrTAAAAAAAAAAAAAAAAAAAGGGCX^ 

TGG^GTGTCCTGTAGGGAAAGGCCCTGTTTTCCCTGAGGCGGGGCTGGGCTTGTC^ 

GG ™T^ gccc ^ cgtgtctctagctcc " c " gccggg ^ c ^ g ^c^ 

^^^^^^^^^^^^^^^^^^^^^^^^^^^G^GCCTGAGGTGCTCCTGAGATGCTG 
n«^^^^^^^ GG ^ GG ^ GA ^^ G ^ GTGGC ^ GG ^^^^^^^^^^^G^CTGGGGAAACTAAGCTC 

°!^^^r rccAAAGAccGAGGATC 

^ GAA ^^^ CGT ^ GGTGTCTCAG ^ 
CTtSCGCTCGGGAGTGCGC^ 

CCTCACAGGAAGTTGGGCTCCCGCACCACCAGGCAGGGGGGGCTCCCGCCGCCGCCGCCGCCACCACCGTCCAGG 

~5^ tagacaaagtcgaagtcgcgctogggctcgct ^ 

TCGTCCGCCAGCTGGAAGCAGCGCCCGTCCACCAGCACGAACAGCCGGTGCGCCT 
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FIGURE 32 

MCFLNKLLLLAVLGWLFQIPTVPEDLFFl^EG 

CPYIGELRKLLASWVSGSSGRSGGFMRKITPTTTTSLGAQPSQTSQGLQAQLAQAFFHNQPP 
SLRRTVE FVAERI GSNCVKH I KATLVADLVRQ AE SLLQEQLVTQGEEGGD PAQLLE I LCSQL 

CPHGAQATxALGREFCQRKSPGAVRALLPEETPAAVLSSAENIAVGLATEKACAWLSANITAL 
IRREVKAAVSRTLRAQGPEPAARGERRGCSRA 

Signal peptide: 

amino acids 1-18 

N-glycosylation site. 

amino acids 244-248 

cAMP- and cGMP-dependent protein kinase phosphorylation site. 

amino acids 89-93 

Casein kinase II phosphorylation site. 

amino acids 21-25, 167-171, 223-227 

N-myristoylation site. 

amino acids 100-106, 172-178, 207-213 

Microbodies C-terminal targeting signal. 

amino acids 278-282 
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FIGURE 33 

TCCCTTGACAGGTCTGGTGGCTGGTTCGGGGTCTACTGAAGGCTGTCTTGATCAGGAAACTG 
AAGACTCTCTGCTTTTGCCACAGCAGTTCCTGCAGCTTCCTTGAGGTGTGAACCCACATCCC 

TGCCCCCAGGGCCACCTGCAGGACGCCGACACCTACCCCTCAGCAGACGCCGGAGAGAAMS 
AGTAGCAACAAAGAGCAGCGGTCAGCAGTGTTCGTGATCCTCTTTGCCCTCATCACCATCCT 
CATCCTCTACAGCTCCAACAGTGCCAATGAGGTCTTCCATTACGGCTCCCTGCGGGGCCGTA 
GCCGCCGACCTGTCAACCTCAAGAAGTGGAGCATCACTGACGGCTATGTCCCCATTCTCGGC 
AACAAGACACTGCCCTCTCGGTGCCACCAGTGTGTGATTGTCAGCAGCTCCAGCCACCTGCT 
GGGCACCAAGCTGGGCCCTGAGAT CGAG CGGGCTGAGTGTACAATCCGCATGAATGATGCAC 
C CAC CACTGGCT ACTCAG CTGATGTGGGCAACAAGACC AC CT ACCGCGT CGTGG CCCATT C C 
AGTGTGTTC C G CGT GCTGAGGAGGCC CC AGGAGTTTGT CAACCGGAC CC CTGAAAC CGTGTT 
CATCTTCTGGGGGCCCCCGAGCAAGATGCAGAAGCCCCAGGGCAGCCTCGTGCGTGTGATCC 
AGCGAGCGGGCCTGGTGTTCCCCAACATGGAAGCATATGCCGTCTCTCCCGGCCGCATGCGG 
CAATTTGACGACCTCTTCCGGGGTGAGACGGGCAAGGACAGGGAGAAGTCTCATTCGTGGTT 
GAGC AC AGG CTGGTTT AC CATG GTGATCGCGGTGGAGTTGTGTGAC CACGTG CATGT CTATG 
GbvTGGTCCCCCCO^CTACTGCAGCCAGCGGCCCCGCCTCCAGCGCATGCCCTACCACTAC 
TA CG AG CC CAAGGGGC CGGACGAATGTGT CACCT ACAT CCAG AATG AGCACAGT CG CAAGGG 
CAACCA.CCACCGCTTCAT»CCGAGAAAAGGGTCTTCTCATCGTGGGCCCAGCTGTATGGCA 
TCAC CTTCTCC CAC CC CTCCTGGACCTAGGCCAC CCAG CCTGTGGG AC CT CAGG AGGGTCAG 
AGGAGAAGC AG CCT CCGCCCAGCCGCTAGG CCAGGG ACCAT CTT CTGGC C AAT CAAGGCTTG 
CT GGAGTGT CT CCCAGCCAATCAGGGCCTTGAGG AGGATGT ATC CT C C AG CC AATC AGGGCC 
TGGGGAATCTGTTGGCGAATCAGGGATTTGGGAGTCTATGTGGTTAATCAGGGGTGTCTTTC 
TTGTGCAGTCAGGGTCTGCG CACAGTCAAT CAGGGTAGAGGGGGTATTTCTGAGTCAATCTG 
AGGCTAAGGACATGTCCTTT CC CATGAGGCCTTGGTTC AGAG CC CCAGGAATGGAC CCCCCA 
ATCACTCCCCACTCTGCTGGGATAATGGGGTCCTGTCCCAAGGAGCTGGGAACTTGGTGTTG 
CC CCCT CAATTT CCAG CA CCAG AAAGAGAGATTGTGTGG GGGTAGAAG CTGTCTGGAGGC CC 
GGCCAGAGAATTTGTGGGGTTGTGGAGGTTGTGGGGGCGGTGGGGAGGTCCCAGAGGTGGGA 
GGCTGGCATCCAGGTCTTGGCTCTGCCCTGAGACCTTGGACAAACCCTTCCCCCTCTCTGGG 
CACCCTTCTGCCCACACCAGTTTCCAGTGCGGAGTCTGAGACCCTTTCCACCTCCCCTACAA 
GTGCCCTCGGGTCTGTCCTCCCCGTCTGGACCCTCCCAGCCACTATCCCTTGCTGGAAGGCT 
C^GCTCTTTGGGGGGTCTGGGGTGACCTCCCC^CCTCCTG^ 

GCAAACTC CTT C AGGG TTGGGG GACTCTGAAGGAAACGGG ACAAAAC CTTAAG CTGTTTT CT 
TAGCCCCTCAGCCAGCTGCCATTAGCTTGGCTCTTAAAGGGCCAGGCCTCCTTTTCTGCCCT 
CT AGCAGGGAGGTTTT CCAACTGTTGGAGGCGCCTTTGGGGCTG CC C CTTTG TCTGGAGTCA 
CTGGGGGCTTCCGAGGGTCTCCCTCGACCCTCTGTCGTCCTGGGATGGCTGTCGGGAGCTGT 
ATCACCTGGGTTCTGTCCCCTGGCTCTGTATCAGGCACTTTATTAAAGCTGGGCCTCAGTGG 
GGTGTGTTTGTCTCCTGCTCTTCTGGAGCCTGGAAGGAAAGGGCTTCAGGAGGAGGCTGTGA 
. GG CTGGAGGGAC CAGATGGAGGAGGC CAGCAG CT AGC CATTGCACACTGGGGTGATGGGTGG 
GGGCGGTGACTG C C CCAGACTT GGTTTTGT AATGATTT GT ACAGGAAT AAACAC ACCTACGC 
TCCGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 34 

MSSNKEQRSAVFVILFALITILILYSSNSANEVFHYGSLRGRSRRPVNLKKWSITDGYVPIL 
GNKTLPSRCHQCTIVSSSSHUiGTKLGPEIERAECTIRMNDAPTTGYSADVGNKTTYRVVAH 
SSVFRVLRRPQEFVNRTPETVFIFWGPPSKMQKPQGSLVRVIQRAGLVFPNMEAYAVSPGRM 
RQFDDLFRGETGKDREKSHSWLSTGWFTMVIAVELCDHVHVYGMVPPNYCSQRPRLQRMPYH 
YYE PKGPDECVTY I QNEHSRKGNHHRF ITE KRVFS SWAQLYG I TFSHPS WT 

Signal peptide: 

amino acids 1-29 

Transmembrane domain: 

amino acids 9-31 (type II) 

N-glycosylation site. 

amino acids 64-68, 115-119 

cAMP- and cGMP-dependent protein kinase phosphorylation site.

amino acids 50-54 

Casein kinase II phosphorylation site. 

amino acids 3-7, 29-33, 53-57, 197-201 

Tyrosine kinase phosphorylation site. 

amino acids 253-262 

N-myristoylation site. 

amino acids 37-43, 114-120, 290-294 
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FIGURE 35 

GTTTCTCATAGTTGGCGTCITCTAAAGGAAAAAC^ 

^GGGAAGCATCCCTAGCTGTTGGCGCAGAGGGGCGAGGCTGAAGCCGAGTGGCCCGAGG 

GG CAAAGGTG AAAGAGTTTCAGAACAAG GTT C CTGGAACC CATGAC C CATGAAGT C TTGTCGACATTTATAC CGT 

CTGAGGGTAGCAGCTCGAAACTAGAAGAAGTGGAGTGTTGCCAGGGACGGCA^ 

GGCCTATGGGACGTTGGCTTCAGACCm^ 

AGGCCTGAGGTCACACTGGCTTGCCTCCTCCTAGCCACAGCAGGCTGCTTTGCTGACTTGAAra 

GTCACCGTCCAGCCTGCGTCCACCGTCCAGAAGCCCGGAGGCACTGTGATCTTGGGCTGCGTGGTGGAACCTCCA 

AGGATGAATGTAACCTGGCGCCTGAATGGAAAGGAGCTGAATGGCTCGGATGATGCTCTGGGTGTCOT 

CACGGGACCCTCGTCATCACTGCCCTTAACAACCACACTGTGGGACGGTACCAGTGTGTGGCCCGGATGG 

GGGGCTGTGGCCAGCGTGCCAGCCACTCTGACACTA 

ATTGAAGTGGATGAGGGAAACACAGCAGTCArrGCCTGCCACCTGCCTGAGAG 

TACAGCGTCAAACAAGAGTGGCTGGAGGCCTCCAGAGGTAACTACCTGATC^TGCCCTCAGGGAACCTCCAGATT 

GTGAATGCCAGCCAGGAGGACGAGGGCATGTACAAGTGTGCAGCCTACAACCCAGTGACCCAGGAAGTGAAAACC 

TCCGGCTCCAGCGACAGGCTACGTGTGCGCCGCTCCACCGCTGAGGCTG CC CGCATCATCTACCCCCCAGAGGCC 

CAAACCATCATCGTCACCAAAGGCCAGAGTCTCATTCTGGAGTGTGTGGCCAGTGGAATCCCACCCCCACGGGTC 

AC CTGGG C CAAGGATGGGTC CAGTG TCACCGGCTACAACAAG AC GC G CTTCCTGCTGAGCAACCTC CTCATCG AC 

ACCACC^GCGAGGAGGACTCAGGCACCTACCGCTGCATGGCCGACAATC 

ATCCTCTACAATGTCCAGGTGTTTGAACCCCCTGAGGTCACCATGGAGCT^ 

CAGAGTGCCAAGCTTACCTGTGAGGTGCGTGC5GAACCCCCCGCCCTCCGTGCTGTGGCTGAG 

CTCATCTCCAGCCAGCGCCTCCGGCTCTCCCGCAGGGCCCTC 

GTCTACCAGTGCATGGCCGAGAACCAGGTTGGGAGCGCCCATGCCG^ 

ATAACCCCAAGGCTATGGCAGGATGCrGAGCTGGCTACTGGCACACCT 

CCTGAGCAGATGCTGAGGGGGCAACCGGCGCTCCCCAGACCCCC^ 

CCAGGAGAGAAGGGGCAGGGGGCTCCCGCCGAGGCTCCCATCATC CTTCAGCTCG CC CCGCACCTCCAAGACAGAC 

TCATATGAACTGGTGTGGCGGCCTCGGCATGAGGGCAGTGGCCGGGCGCCAATCCTCTACT 

CGCAAGCAGGTCACAAATTCCTCTGACGATTGGACCATCTCTGGCAT^ 

ACCAGACTTGACCCCGGGAGCTTGTATGAAGTGGAGATGGCAGCTTACAACTGTGCGGGAGAGGGCCA^ 
ATGGTCACCTTC CG AACTGGACGGCGGCCCAAACCCGAGATCATGGCCAGCAAAGAGCM CAGAGAGAC 
GACCCTGGAGCCAGTCCCCAGAGCAGCAGCCAGCCAGACCACGGCCG^ 

CCCACCATCTCCACGGCCTCCGAGACCTCAGTGTACGTGACCTGGATTCCCCGTGGGAATGGTGGGTTCCCAATC 

CAGTCCTTCCGTGTGGAGTACAAGAAGCTAAAGAAAGTGGGAGACTGGATTCT^ 

TCGCGGCTGTCCGTGGAGATCACGGGCCTAGAGAAAGGCACCTCCTACIAAGTTTCX3AG 

CTGGGGGAGAGCGAGCCCAGCGCCCCCTCTCGGCCCTACGTGGTGTCOT 

CCCGTGGCAGGTCCTTATATCACCTTCACGGATGCGGTCAATGAGACCACCATCATGCTC^ 

CCAGCAACTAACAACAACACCCCAATCCATGGCTTrTATATCTATTATCG^ 

GACTACAAGAAGGATATGGTGGAAGGGGACAAGTACTGGCACTCCATCAGCCACCT 

GACATTAAGATGCAGTGCTTCAATGAAGGAGGGGAGAGCGAGTTCAGCAACGTGATGATCT 

CGGAAGTCITCTGGCCAGCCTGGTCGACTGCCACCCCCAACTCTGGCCCCACCA 

ATAGAGTOGCCGCTGGGCACTCGGGCCATGGT^ 

CTGGGCTCCATCGTTCTCATCATCGTCACCTTCATCCCCTTCTGCTTG 

ACAACAGACCTGGGTTTTCCTCGAAGTGCCCTTCCACCCT^ 

CCAGGCCACCAGG C CAGTGGACAGC C CT AC CT GAG TG G CATCAGTGGACGGG CCTGTGCTAATGGGATCCACATG 
AATAGGGGCTGCCCCTCGGCTG CAGTGGGCTACC CGGGCATGAAGCCC CAGCAGCACTGCCCAGGCGAG CTTCAG 
CAGCAGAGTGACACCAGCAGCCTGCTGAGGCAGACCCATCTTGGC^TGGATATGACC 

ACGAGGGGTCCCAAGTCTAGCCCGGACGAGGGCTCTTTCTTATACACACTGCCCGACGACTCCACTCACCAGCTG 

CTTGCAGCCCCATCACGACTGCTGCCAACGCCAGGAGCAGCCTGCTGCTGTGGGCCAGTCAG 

CCCGACAGTCCTGTCCTGGAAGCAGTGTGGGACCCTCCATTTCACTCAGGGCCCCCATGC 

CCAGTTGAAGAGGTGGACAGTCCTGACTCCTGCCAAGTGAGTGGAGGAGACTGGTGTCCCCA 

GCCTACGTAGGACAGXIAACCTGGAATGCAGCTCrCCCCGGGGCCACT 

CTCACAATTTAGGCAGAAGCTGATATCCCAGAAAGACT 

AG fS^SfS AGAAAATTGG TATTT AT TTTT CT ATTATAGC C ATATTTATATATTT ATG CACTTG T AAAT AAATG TA 
TATGTTTTAT AATTCTGG AGAGACAT AAGGAGTC CTACC CGTTG AGGTTG GAGAGGGAAAATAAAGAAG CTG C CA 
CCTAACAGGAGTCACCCAGGAAAGC^CCGCACAGGCTGGCGCGGGACAGACTCCTAACCTGGGGCCTCTGCAGTG 
GCAG GCGAGG CTG C AGGAGGCC CACAGATAAG CTGGC AAGAGGAAGGATCCCAGGCACATGGTT CAT CACGAG C A 
TGAGGGAACAG CAAGG GG CACGGTATC ACAG CCTGGAG AC ACCCACACAGATGGCTGGATCCG GTGCTAC GGGAA 
ACATTTTCC T AAG ATGC C CATGAGAAC AGAC CAAG ATGTGTACAGCACTATGAGCATTAAAAAAC C TTC CAGAAT 
CAATAATCCGTGGCAACATATCTCTGTAAAAACAAACACTGTAACTTCT 
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FIGURE 36 

MLRGTMTAWRGMRPEVTLACIJ^TAGCFADLNEVPQVTVQPASTVQKPGGTVILGCVVEPP 
RMNVTWRLNGKE LNGSDDALG VL I THGTLV I TALNNHT VGRYQCVARMPAGA VAS VP ATVTL 
ANLQDFKLDVQHVIEVDEGNTAVIACHLPESHPKAQVRYSVKQEWLEASRGfTYLIMPSGNLQ 
I VNASQEDEGMYKCAAYNPVTQEVKTSGSSDRLRVRRSTAEAARI I YPPE AQTI I VTKGQSL 
ILECVASGIPPPRVTWAKDGSSVTGYNKTRFLLSNLLIDTTSEEDSGTYRCMADNGVGQPGA 
AVILYWQVFEPPEVTMELSQLVIPWGQSAKLTCEVRGNPPPSVLWIJ^VPLISSQRLRLS 
RRALRVLSMGPEDEGVYQCMAENEVGSAHAWQLRTSRPSITPRLWQDAELATGTPPVSPSK 
LGNPEQMLRGQPALPRPPTSVGPASPKCPGEKGQGAPAEAPIILSSPRTSKTDSYELVWRPR 
HEGSGRAPILYYVVKHRKQVTNSSDDWTISGIPANQHRLTLTRLDPGSLYEVEMAAYNCAGE 
GQTAMVTFRTGRRPKPEIMASKEQQIQRDDPGASPQSS SQ PDHGRLSPPEAPDRVTISTASE 
TSVYVTWIPRGNGGFPIQSFRVEYKKLKKVGDWILATSAIPPSRLSVEITGLEKGTSYKFRV 
RALNMI^ESEPSAPSRPYWSGYSGRVYERPVAGPYITFTDAVNETTIMLKWMYIPASNNNT 
PIHGFYIYYRPTDSDNDSDYKKDMVEGDKYWHSISHLQPETSYDIKMQCFNEGGESEFSNVM 
ICETKARKSSGQPGRLPPPTLAPPQPPLPETIERPVGTGAMVARSSDLPYLIVGVVLGSIVL 
I IVTFI PFCLWRAWSKQKHTTDLGFPRSALPPSCPYTMVPLGGLPGHQASGQPYIiSGISGRA 
CANGIHMNRGCPSAAVGYPGMKPQQHCPGELQQQSDTSSLLRQTHLGNGYDPQSHQITRGPK 
SSPDEGSFLYTLPDDSTHQLLQPHHDCCQRQEQPAAVGQSGVRRAPDSPVLEAVWDPPFHSG 
PPCCLGLVPVEEVDSPDSCQVSGGDWCPQHPVGAYVGQEPGMQLSPGPLVRVSFETPPLTI 

Signal peptide: 

amino acids 1-30 

Transmembrane domain : 

amino acids 16-30 (type II), 854-879 
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FIGURE 37

CGGGAGGCTGGGTCGTCATGATCCGGACCCCATTGTCGGCCTCTGCCCATCGCCTGCTCCTC 
CCAGGCTCCCGCGGCCGACCCCCGCGCAAC^TGCAGCCCACGGGCCGCGAGGGTTCCCGCGC 
GCTCAGCCGGCGGTATCTGCGGCGTCTGCTGCTCCTGCTACTGCTGCTGCTGCTGCGGCAGC 
CCGTAACCCGCGCGGAGACCACGCCGGGCGCCCCCAGAGCCCTCTCCACGCTGGGCTCCCCC 
AGCCTCTTCACCACGCCGGGTGTCCCCAGCGCCCTCACTACCCCAGGCCTCACTACGCCAGG 
CACCCCCAAAACCCTGGACCTTCGGGGTCGCGCGCAGGCCCTGATGCGGAGTTTCCCACTCG 
TGGACGGCCACAATGACCTGCCCCAGGTCCTGAGACAGCGTTACAAGAATGTGCTTCAGGAT 
GTTAACCTGCGAAATTTCAGCCATGGTCAGACCAGCCTGGACAGGCTTAGAGACGGCCTCGT 
GGGTGCCCAGTTCTGGTCAGCCTCCGTCTCATGCCAGTCCCAGGACCAGACTGCCGTGCGCC 
TCGCCCTGGAGCAGATTGACCTCATTCACCGCATGTGTGCCTCCTACTCTGAACTCGAGCTT 
GTGACCTCAGCTGAAGGTCTGAACAGCTCTCAAAAGCTGGCCTGCCTCATTGGCGTGNAGGG 
TGGT CACT CACTG GACAGC AG C CTCT CTGTGCTGCGCAGTTTCT ATGTGCTGGGGGTGCGCT 
ACCTGACACTTACCTT CAC CTGCAGTACAC CATGGG CAGAGAGTTC C ACCAAGTT CAGACAC 
CACAT GTACA CCAACGT CAG C GGATT GA CAAG CTTT GG T GAG AAAG T AGT AG AGGAGTTG AA 
CCGCCTGGGCATGATGATAGATTTGTCCTATGCATCGGACACCTTGATAAGAAGGGTCCTGG 
AAGTGTCTCAGGCTCCTGTGATCTTCTCCCACTCAGCTGCCAGAGCTGTGTGTGACAATTTG 
TTGAATGTT C CCGATGATATCC TG CAGCTT CT GAAGAACGGTGG CATCGTGATGGTGACACT 
GTCCATGGGGGTGCTGCAGTGCAACCTGCTTGCTAACGTGTCCACTGTGGCAGATCACTTTG 
ACCACATCAGGG CAGT CATTGG AT CTGAGTTCATCGGGATTGGTGGAAATTATGACGGGACT 
GGCCGGTTCCCTCAGGGGCTGGAGGATGTGTCCACATACCCAGTCCTGATAGAGGAGTTGCT 
GAG TCGTAS CTGGAGCGAGGAAGAGC TT CAAGGTGTCCTTCGTGGAAACCTG CT GCGGGTCT 
TCAGACAAGTGGAAAAGGTGAGAGAGGAGAGCAGGGCGCAGAGCCCCGTGGAGGCTGAGTTT 
CCATATGGGCAACTGAGCACATCCTGCCACTCCCACCTCGTGCCTCAGAATGGACACCAGGC 
TACTCATCTGGAGGTGACCAAGCAGCCAACCAATCGGGTCCCCTGGAGGTCCTCAAATGCCT 
CCCCATACCTTGTTCCAGGCCTTGTGGCTGCTGCCACCATCCCAACCTTCACCCAGTGGCTC 
TGCTQACACAGTCGGTCCCCGCAGAGGTCACTGTGGCAAAGCCTCACAAAGCCCCCTCTCCT 
AGTTCATTCACAAG CATATG CTGAGAATAAACATGTTACACATGG AAAA 
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FIGURE 38 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA59817
<subunit 1 of 1, 487 aa, 1 stop, 2 unknown
<MW: 53569.32, pi: 7.68, NX(S/T): 5

MQPTGREGSRALSRRYIiliUjLLLLLLLLLRQPWRAETTPGAPRALSTLGSPSLFTTPGVPS 
ALTTPGLTTPGTPKTLDLRGRAQALMRSFPLVDGHNDLPQVLRQRYKNVLQDVNLRNFSHGQ 
TSLDRLRDGLVGAQFWSASVSCQSQDQTAVRLALEQIDLIHRMCASYSELELVTSAEGLNSS 
QKLACLIGVXGGHSIJDSSLSVLRSFYVLGVRYLTLTFTCSTPWAESSTKFRHHMYTOVSGIiT 
SFGEKVVEELNRLGMMIDLSYASDTLTRRVLEVSQAPVI^^ 

LKNGGIVMVTLSMGVLQCNLLANVSTVADHFDHIRAVIGSEFIGIGGNYDGTGRFPQGLEDV 
S T Y P VL I E ELLS RXWS EEELQG VLRGNLLRVFRQVEKVREE SRAQ S P VEAE FPYGQLSTSCH 
SHLVPQNGHQATHLEVTKQPTNRVPWRS SNAS PYLVPGLVAAAT I PTFTQWLC 

Important features of the protein: 
Signal peptide: 

amino acids 1-36 

Transmembrane domain: 

amino acids 313-331 

N-glycosylation sites. 

amino acids 119-122, 184-187, 243-246 and 333-336 
N-myristoylation sites.

amino acids 41-46, 59-64, 73-78, 133-138, 182-187, 194-199, 324- 
329, 354-359, 357-362, 394-399, 427-432 and 472-477. 

Prokaryotic membrane lipoprotein lipid attachment site. 

amino acids 136-146 
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FIGURE 39 

TGCTAGGCTCTGTCCCACAATGCACCCGAGAGCAGGAGCTGAAAGCCTCTAACACCCACAGA 

TCCCTCTATGACTGCAATGTGAGGTGTCCGGCTTTGCTGGCCCAGCAAGCCTGATAAGCA£S 
AAGCTCTTATCTTTGGTGGCTGTGGTCGGGTGTTTGCTGGTGCCCCCAGCTGAAGCCAACAA 
GAGTTCTGAAGATATC CGGTGC AAATGCAT CTGT CC AC CTTATAGAAACAT CAGTGGG CACA 
TTTACAAC CAGAATGT AT C C C AGAAGGACTGC AACTGC CTG C ACGTGGTGGAG C CCATG CCA 
GTGCCTGGCCATGACGTGGAGGCCTACTGCCTGCTGTGCGAGTGCAGGTACGAGGAGCGCAG 
CACCACCACCATCAAGGTCATCATTGTCATCTACCTGTCCGTGGTGGGTGCCCTGTTGCTCT 
ACATGGCCTTCCTGATGCTGGTGGACCCTCTGATCCGAAAGCCGGATGCATACACTGAGCAA 
CTGCACAATGAGGAGGAGAATGAGGATGCTCGCTCTATGGCAGCAGCTGCTGCATCCCTCGG 
GGGACCCCGAGCAAACACAGTCCTGGAGCGTGTGGAAGGTGCCCAGCAGCGGTGGAAGCTGC 
AGGTGCAGGAGCAGCGGAAGACAGTCTTCGATCGGCACAAGATGCTCAGCTAGATGGGCTGG 
TGTGGTTGGGTCAAGGCCCCAACACCATGGCTGCCAGCTTCCAGGCTGGACAAAGCAGGGGG 
CTACTTCTCCCTTCCCTCGGTTCCAGTCTTCCCTTTAAAAGCCTGTGGCATTTTTCCTCCTT 
CTCCCTAACTTTAGAAATGTTGTACTTGGCTATTTTGATTAGGGAAGAGGGATGTGGTCTCT 
GATCTCTGTTGTCTTCTTGGGTCTTTGGGGTTGAAGGGAGGGGGAAGGCAGGCCAGAAGGGA 
ATGGAGACATTCGAGG CGG CCTCAGGAGTGGATG CGAT CTGTCTCT C CTGGCT C CACTCTTG 
CCGCCTTCCAGCTCTGAGTCTTGGGAATGTTGTTACCCTTGGAAGATAAAGCTGGGTCTTCA 
GGAACTCAGTGTCTGGGAGGAAAGCATGGCCCAGCATTCAGCATGTGTTCCTTTCTGCAGTG 
GTTCITATCAC»CCTCCCTCCCAGCCCCGGCGCCTCAGCCCCAGCCCCAGCTCCAGCCCTG 
AGGACAGCTCTGATGGGAGAGCTGGGCCCCCTGAGCCCACTGGGTCTTCAGGGTGCACTGGA 
AGCTGGTGTTCGCTGTCCCCTGTGCACTTCTCGCACTGGGGCATGGAGTGCCCATGCATACT 
CTGCTGCCGGTCCCCTCACCTGCACTTGAGGGGTCTGGGCAGTCCCTCCTCTCCCCAGTGTC 
CACAGTCACTGAGCCAGACGGTCGGTTGGAACATGAGACTCGAGGCTGAGCGTGGATCTGAA 
CACCAC^GCCCCTGTACTTGGGTTGCCTCTTGTCCCTGAACTTCGTTGTACCAGTGCATGGA 
GAGAAAATTTTGTCCTCTTGTCTTAGAGTTGTGTGTAAATCAAGGAAGCCATCATTAAATTG 
TTTTATTTCTCTCA 
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FIGURE 40

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA60278 
<subunit 1 of 1, 183 aa, 1 stop
<MW: 20574, pi: 6.60, NX(S/T): 3 

MKLLSLVAWGCLLVPPAEANKSSEDIRCKCICPPYRNISGHIYNQWSQKDCNCLHVVEPM 
PVPGHDVEAYCLLCECRYEERSTTTIKVIIVIYLSWGALLLYMAFLMLVDPLIRKPDAYTE 
QLHNEEENEDARSMAAAAASLGGPRANTVLERVEGAQ 

Important features: 
Signal peptide: 

amino acids 1-20 

Transmembrane domain: 

amino acids 90-112 

N-glycosylation sites. 

amino acids 21-24, 38-41 and 47-50 
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FIGURE 41 

AGCX^SGTCTrCGCTTGGGTTCCGCT 
TCCCTTTGCATTCCCACCCCTCCGGGCTTTGCGTC^ 

CGGAGCAAGGATTCGTCCTGCTGCCTGCTCCTACTGGCCGCGGTGCTGATGGTGGAGAGCTCACAGATCGGCAGT 
TCGCGGGCCAAACTCAACTCCATCAAGTCCTCTC7GGGCGGGGAGACGCCTGGTCAGGCCGCCAATCGATCT 
GGCATGTACCAAGGACTG^CATTCGGCGGCAGTAAGAAGGGCAAAAACCTG GG GC AGGCCTACCCTTGTAGCAGT 
GATAAGGAGTGTGAAGTTGGGAGGTATTGCCACAGTCCCCACCAAGGATCATCGGCCTGCATGGTGTGTCGGAGA 
AAAAAGAAG CGCTGCCACCGAGATGGCATGTG CTGCCCCAGTACCCGCTGCAATAATGGCATCTGTATCCCAGTT 
ACTGAAAGCATCTTAACCCCTCACATCCCGG CTCTGGATGG TACTCGGCACAG AGATCG AAACCACGGTCATTAC 
TCAAACCATGACTTGGGATGGCAGAATCTAGGAAGACCACACACTAAGATGTCACATATAAAA 
GACCCCTGCCTACGATCATCAGACTGCATTGAAGGGTTTTGCTGTGCTCGTCA 
CCAGTGCTCCATCAGGGGGAAGTCTGTACCAAACAACGCAAGAAGGGTrCTCATC 

TGCGACTGTGCGAAGGGCCTGTCTTGCAAAGTATGGAAAGATGCCACCTACTCCTCCAAAGCCAGA ^ 

TGTCAGAAAATTTSATCACCATTGAGGAACATCATCAATTGCAGACTGTGAAGTTGT^ 

CATGGTGGAAAATAAGGTTCAGATGCAGAAGAATGGCTAAAATAAGAAACGTGATAAG 

AAAGGGAGAAAGAAAAC ATGAACTGAAT AGATTAGAATGGGTGAC AAATG CAGTG CAG CCAGTG TTTCCATTATG 

CAACTTGT CTATGTAAATAATGTACACATTTGTGG AAAATG CTATT ATTA^ CACAC AG TGGAAATT 

ACTGATGAGTAGCATGTGACTTTCCAAGAGTTTAGGTTGTGCTGGAGGAGAGGTTTCCTTCA 

TTATACAAATAACCTACATGCCAGATTTCTATTCAACGTTAGAGTTTAACAAAATACTCCTAGAATAACTTGTTA 

TACAAT AGGT TCT AAAAATAAAATTGCT AAACAAGAAATG AAAACATGG AG CATTGTT AATTTACAACAGAAAAT 

TACCTTTTGATTTGTAACACTACTTCTGCTGTTCAATCAAGAGTCTTGGTAGATAA 

TTCCAAATAATTGCAAAATAATGGCCAGTTGTTTAGGAAGGCCTTTAGGAAG^ 

C CACAAATAC TTlU"rri'TCAAAATTTTAGTITTACCTGTAATTAATAAGAAC TG AT ACAAGACAAAAACAGTTC C 
TTCAGATTCTACGGAATGACAGTAT AT CT CTCTTTATCC TATGTGATTCCTGC TCTG AATGCATTATATTTTCC A 
AACTATAC CCATAAATTGTGACTAGTAAAATAC TTACACAGAGCAGAATTTTCACAGATGGCAAAAAAATTTAAA 
GATGTC CAATATATGTGGGAAAAGAGCTAACAGAGAGATCAT TATTTCTT AAAGATTGG C CATAAC CTATATTTT 
GATAGAATTAGATTGGTAAATACATCTATTCATACAT^ 
CACTGGAGTAAG<^GAAAATTGGGAAAACTTTTTCGTTT^ 

AGG CACAAGTTGG CTGTTCATCTTTGAAAC CAGGGGATGCACAGTCTAAATGAATATCTGCATG GGATTTGCTAT 
CATAATATTTACTATG CAGATGAATTCAGTGTGAGGTCCTGTGT CC<5TACTATC CTC AAATTATTT ATTTTATAG 
TGCTGAGATCCTCAAATAATCTCAATTTCAGGAGGTTTCA 
TTTCATTGCCCTCTATAAGCITCTGACTAGCCAATGGCAT^ 

CTTTATTG CCAAAGGG CTAGTTTCGGT TTT CTG CAGCCATTG CG G TTAAAAAAT ATAAGT AGGATAACTTGTAAA 
AC CTGCATATTGCT AAT C TATAG ACAC CACAGT TTCTAAATTCTT TGAAACCACTTTACTACTTT I'l'lTAAACTT 
AACTCAGTTCTAAATACTTTGTCTGGAGCACAAAACAATAAAATO 

TAGACC^CAATTGAu"l-l"l-lTAGTTTTCTTTTACTTAAATCCCAT CTGCAGTCT CAAATTTAAGTT CTC C CAGTAG 
AGATTGAGTTTGAGCCTGTATATCTATTAAAAATT^ 

CATTTTCTGCACAGGTCTGCAAAAACAAAAATTATAAACTAGTCC^TCCAAG 
TGCTATAAGCTTGTGAAATGAAAATGGAACATTTCAATCAAA 
TTGGTTTCTGCAATATTTTTCTTATGTCCACCCTTTTAAAAATTAT 
TTAATGAGATGTATTTTCTTATAGAGATATTT^ 

TTTCTAATTTAGGAAAAATGTATAATAAGATAAAATCTATTAAATTTTTCTCCT 
AAAAAAAAAAAAAAAAAAAA 
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FIGURE 42 

MAALMRS KBS S C CLLLLAAVLMVE S S Q I GS S RAKLNS I KS SLGGE T PGQAANRS AGM YQGLA 
FGGSKKGKNLGQAYPCSSDKECEVGRYCHSPHQGSSACMVCRRKKKRCHRDGMCCPSTRCNN 
GI C I PVTES I LTPH I P ALDGTRHRDRNHGHYSNHDLGWQNLGRPHTKMSH I KGHEGDPCLRS 
SDCIEGFCCARHFWTKICKPVLHQGEVCTKQRKKGSHGLEIFQRCDCAKGLSCKVWKDATYS 
SKARLHVCQKI 

Signal peptide: 

amino acids 1-25 



VI f 2.70 
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FIGURE 43 

TCTCAATCTGCTGACCTCGTGATCCGCCTGACCTTGTAATCCACCTACCTTGGCCTCCCAAA 
GTGTTGGGATTACAGGCGTGAG CC AC C G CG CC CG G C CAAC AT CACGTTTT TAAAAATTG ATT 
TCTTCAAATTCATGGCAAATATTTCCCTTCCCTTTAACTTCTTATGTCAGAATGAGGAAGGA 
TAGCTGCATTTATTTAGTCAGTTT TCATTG CATAGT AATATTTT CATGTAGTATTTTCT AAG 
TTATATTTTAGTAATTCATATGTTTTAGATTATAGGTTTTAACATACTTGTGAAAATACTTG 
ATOTGTTTTAAAGCCTTGGGCAGAAATTCTGTATTGTTGAGGATTTGTTCTTTTATCCCCCT 
TTTAAAGTCATCCGTCCTTGGCTCAGGArrTGGAGAGCTTGCACCACCAAAAATGGCAAACA 
TCACCAGCTCCCAGATTTTGGACCAGTTGAAAGCTCCGAGTTTGGGCCAGTTTACCACCACC 
CCAAGT AC ACAGCAGAATAGTACAAGTCAC CCTACAACTACTACTTCTTGGGACCT CAAGCC 
CCCAACATCCC^GTCCTCAGTCCTCAGTCATCTTGACTTCAAATCTCAACCTGAGCCATCCC 
CAGT TC TTAGCCAGTTGAGC CAG CG ACAACAG CAC CAGAG C C AGG CAGTC ACTG TTC CTC CT 
CCTGGTTTGGAGTCCTTTCCTTCCCAGGCAAAACTTCGAGAATCAACACCTGGAGACAGTCC 
CTCC^CTGTGAACAAGCTTTTGCAGCTTCCCAGCACGACCATTGAAAATATCTCTGTGTCTG 
TCCACCAGCCACAGCCCAAACACATCAAACTTGCTAAGCGGCGGATACCCCCAGCTTCTAAG 
ATCC CAG CTTCTGCAGTGGAAATG CCTGGTT CAGCAGATG TCACAGGATT AAATGTGCAGTT 
TGGGGCTCTGG AATTTGG GT CAGAAC CTTC TCTCT CTGAATTTGGAT CAG C TCCAAGCAGTG 
AAAATAGTAAT CAGATTC CCATCAGCTTGTATT CGAAGTCTTTAAGTGAGC CTTTGAATACA 
TCTTTATCAATG AC CAGTGC AGTACAGAACTC CACATATACAACTT C CGTCATTAC CT C CTG 
CAG T C T GAC AAG CT CAT CAC TG AATT CT GC T AG T C CAG T AGC AATGT CT T C CT CTT ATGA C C 
AG AG TT CTGTGCATAACAGG ATC C CAT ACCAAAG CCCTGTGAGTTCAT C AGAGTCAGCTCCA 
GGAA CCAT C ATGAATGGACATGGTGGTGGT CGAAGT CAGCAGACACTAGACAGTAAGTATAG 
CAGCAAGCTA CTCT TGTCATGGCTGGTGCCAAC CAAAC AG AG GAAGAGGAT AGCTCACGTGA 
TGTGGAAAACACCAGTTGGTCAATGGCTC^TTCGTIAAAAAGCAGCCCTTTTGCTTTTTTGT 
TTTTGGACCAGGTGTTGGCTGTGGTGTTATTAGAAATGTCTTAACCACAGCAAGAAGGAGGT 
GGTGGTCTCATATTCTTCTGCCCTAATCAGACTGCACCACAAGTGCAGCATACAGTATGCAT 
TTTAAAGATGCTTGGGCCAGGCGGGGTGGCTGATGCCCATAATCCCAGTGCTTTGGGGGGCC 
AAGGCAGGCAGATTGC C CAAGCT CAGGAGTTTGAGAC CAC C C TGGGCAACAT GGTGAAACTC 
TGTCTCTACTAAAATACGAAAAACTAGCCGGGTGTGGTGGCGGCGCGTGCCTGTAATCCCAG 
CTACTTGGGAGG CTGAGG CACAAG AATC GCTTGAGCCAG CTTGGGCTACAAAGTGAGA CTCC 
GTCTGAAAAGA 
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FIGURE 44 

MCFKALGOTSVLLRICSFIPLLKSSVMSGFGELAPPKMANITSSQILDQLKAPSLGQFTTT 
PSTQQNSTSHPTTTTSWDLKPPTSQSSVLSHLDFKSQPEPSPVLSQLSQRQQHQSQAVTVPP 
PGLESFPSQAKLRESTPGDSPSTVNKLLQLPSTTIENISVSVHQPQPKHIKLAKRRIPPASK 
IPASAVEMPGSADVTGLNVQFGALEFGSEPSLSEFGSAPSSENSNQIPISLYSKSLSEPLNT 
SLSMTSAVQNSTYTTSVITSCSLTSSSLNSASPVAMSSSYDQSSVHNRIPYQSPVSSSESAP 
GT IMNGHGGGRSQQTLDS KYS SKLLLSWLVPTKQRKRI AHVMWKTPVGQWL IR 

Signal peptide: 
amino acids 1-24 



M/270 
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FIGURE 45 

GCCGAGTGGGACAAAGCCTGGGGCTGGGCGGGGGCCATQGCGCTGCCATCCCGAATCCTGCT 

TTGGAAACTTGTGCTTCTGCAGAGCTCTGCTGTTCTCCTGCACTCAGCGGTGGAGGAGACGG 

ACGCGGGGCTGTACACCTGCAACCTGCACCATCACTACTGCCACCTCTACGAGAGCCTGGCC 

GTCCGCCTGGAGGTCACCGACGGCCCCCCGGCCACCCCCGCCTACTGGGACGGCGAGAAGGA 

GGTGCTGGCGGTGGCGCGCGGCGCACCCGCGCTTCTGACCTGCGTGAACCGCGGGCACGTGT 

GGACCGACCGGCACGTGGAGGAGGCTCAACAGGTGGTGCACTGGGACCGGCAGCCGCCCGGG 

GTCCCGCACGACCGCGCGGACCGCCTGCTGGACCTCTACGCGTCGGGCGAGCGCCGCGCCTA 

CGGGCCCCTTTTTCTGCGCGACCGCGTGGCTGTGGGCGCGGATGCCTTTGAGCGCGGTGACT 

TCTCACTGCGTATCGAGCCGCTGGAGGTCGCCGACGAGGGCACCTACTCCTGCCACCTGCAC. 

CACCATTACTGTGGCCTGCACGAACGCCGCGTCTTCCACCTGACGGTCGCCGAACCCCACGC 

GGAGCCGCCCCCCCGGGGCTCTCCGGGCAACGGCTCCAGCCACAGCGGCGCCCCAGGCCCAG 

AC CC CACACTGG CGCG CGG C C ACAACGT CAT CAATGTCAT CGTC CCCGAGAGCCGAGC CC AC 

TT CTTC CAGCAG CT GGGCTACGTG CTGGCCACGCTGCTGCTCTT CATCCTG CT A CTGGTC AC 

TGTCCTCCTGGCCGCCCGCAGGCGCCGCGGAGGCTACGAATACTCGGACCAGAAGTCGGGAA 

AGTCAAAGGGGAAGGATGTTAACTTGGCGGAGTTCGCTGTGGCTGCAGGGGACCAGATGCTT 

TACAGG AGTG AG GACATCCAGCTAGAT TACAAAAACAACAT C CTGAAGGAGAGGGCGGAG CT 

GGCCCACAGCCCCCTGCCTGCCAAGTACATCGACCTAGACAAAGGGTTCCGGAAGGAGAACT 

GCAAATMGGAGGCCCTGGGCTCCTGGCTGGGCCAGCAGCTGCACCTCTCCTGTCTGTGCTC 

CTCGGGGCATCTCCTGATGCTCCGGGGCTCACCCCCCTTCCAGCGGCTGGTCCCGCTTTCCT 

GGAATTTGGCCTGGGCGTATGCAGAGGCCGCCTCCACACCCCTCCCCCAGGGGCTTGGTGGC 

AGCATAGCCCCCACCCCTGCGGCCTTTGCTCACGGGTGGCCCTGCCCACCCCTGGCACAACC 

AAAATCCCACTGATGCCCATCATGCCCTCAGACCCTTCTGGGCTCTGCCCGCTGGGGGCCTG 

AAGACATTC CTGGAGGACACTC CCAT CAGAAC CTGG CAGCCC CAAAAC TGGGGT CAGC CTCA 

GGGCAGGAGTCCCACTCCTCCAGGGCTCTGCTCGTCCGGGGCTGGGAGATGTTCCTGGAGGA 

GGACACT C CCATCAGAACTTGGCAGCCTTGAAGTTG GGGT CAGC CTCGGCAGGAGTCCCACT 

CCTCCTGGGGTGCTGCCTGCCACCAAGAGCTCCCCCACCTGTACCACCATGTGGGACTCCAG 

CTTTGGGCCACCTGGGGCTGCACCCCCTGCCCTTTCTCTGCCCCATCCCTACCCTAGCCTTG 
CTCTCAGCCACCTTGATAGTCACTGGGCTCCCTGTGACTTCTGACCCTGACACCCCTCCCTT 
GGACTCTGCCTGGGCTGGAGTCTAGGGCTGGGGCTACATTTGGCTTCTGTACTGGCTGAGGA 
CAGGGGAGGGAGTGAAGTTGGTTTGGGGTGGCCTGTGTTGCCACTCTCAGCACCCCACATTT 
GCATCTGCTGGTGGACCTGCCACCATCACAATAAAGTCCCCATCTGATTTTTAAAAAAAAAA 
AAAAA 



WO 00/12708 



PCT/US99/20111 



FIGURE 46 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA60618
<subunit 1 of 1, 341 aa, 1 stop
<MW: 38070, pi: 6.88, NX(S/T): 1 

MALPSRI LLWKLVLLQSS AVLLHS AVEETDAGLYTCNLHHH YCHLYES LAVRLEVTDGPPAT 
PAYWDGEKEVLAVARGAPALLTCVNRGHWTDRHVEEAQQVVHTO^ 

YASGERRAYGPLFLRDRVAVGADAFERGDFSLRIEPLEVADEGTYSCHLHHHYCGLHERRVF 
HLTVAE PHAEPP PRGS PGNGS SHSGAPGPDPTLARGHNVINVI VPESRAHFFQQLGYVLATL 
LLF ILLLVTT7LIJUtflRRRGGYEYSDQKSG 
NILKERAELAHSPLPAKYIDLDKGFRKENCK 

Important features: 
Signal peptide: 

amino acids 1-19 

Transmembrane domain: 

amino acids 237-262 

N-glycosylation site.

amino acids 205-208 

Cell attachment sequence. 

amino acids 151-154 

Coproporphyrinogen III oxidase proteins. 

amino acids 115-140 
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FIGURE 47 

CGCCGGAGGCAGCGGCGGCGTGGCGCAGCGGCGACATGGCCGTTGTCTCAGAGGACGACTTT 

CAGCACAGTTCAAACTCCACCTACGGAACCACAAGCAG CAGTCT CC GAGCTGACCAGGAGGC 

ACTGCTTGAGAAGCTGCTGGACCGCCCGCCCCCTGGCCTGCAGAGGCCCGAGGACCGCTTCT 

GTGGCACATACATCATCTTCTTCAGCCTGGGCATTGGCAGTCTACTGCCATGGAACTTCTTT 

ATCACTGCCAAGGAGTACTGGATGTTCAAACTCCGCAACTCCTCCAGCCCAGCCACCGGGGA 

GGACCCTGAGGGCTCAGACATCCTGAACTACTTTGAGAGCTACCTTGCCGTTGCCTCCACCG 

TGCCCTCCATGCTGTGCCTGGTGGCCAACTTCCTGCTTGTCAACAGGGTTGCAGTCCACATC 

CGTGTCCTGGCCTCACTGACGGTCATCCTGGCCATCTTCATGGTGATAACTGCACTGGTGAA 

GGTGGACACTTCCTCCTGGACCCGTGGTTTTTTTGCGGTCACCATTGTCTGCATGGTGATCC 

TCAGCGGTGCCTCCACTGTCTTCAGCAGCAGCATCTACGGCATGACCGGCTCCTTTCCTATG 

AGGAACTCCCAAGCACTGATATCAGGAGGAGCCATGGGCGGGACGGTCAGCGCCGTGGCCTC 

ATTGGTGGACTTGGCTGCATCCAGTGATGTGAGGAACAGCGCCCTGGCCTTCTTCCTGACGG 

CCACCATCTTCCTCGTGCTCTGCATGGGACTCTACCTGCTGCTGTCCAGGCTGGAGTATGCC 

AGGTACTACATGAGGCCTGTTCTTGCGGCCCATGTGTTTTCTGGTGAAGAGGAGCTTCCCCA 

GGACTCCCTCAGTGCCCCTTCGGTGGCCTCCAGATTCATTGATTCCCACACACCCCCTCTCC 

GCCCCATCCTGAAGAAGACGGCCAGCCTGGGCTTCTGTGTCACCTACGTCTTCTTCATCACC 

AGCCTCATCTACCCCGCCGTCTGCACCAACATCGAGTCCCTCAACAAGGGCTCGGGCTCACT 

GTGGACCACCAAGTTTTTCATCCCCCTCACTACCTTCCTCCTGTACAACTTTGCTGACCTAT 

GTGGCCGGCAGCTCACCGCCTGGATCCAGGTGCCAGGGCCCAACAGCAAGGCGCTCCCAGGG 

TTCGTGCTCCTCCGGACCTGCCTCATCCCCCTCTTCGTGCTCTGTAACTACCAGCCCCGCGT 

CCACCTGAAGACTGTGGTCTTCCAGTCCGATGTGTACCCCGCACTCCTCAGCTCCCTGCTGG 

GGCTCAGCAACGGCTACCTCAGCACCCTGGCCCTCCTCTACGGGCCTAAGATTGTGCCCAGG 

GAGCTGGCT GAGG C CACG GGAGTGG TGATGTC CTTTTATGTGTG CTTGGGCTTAACACTGGG 

CTGAGCCTGCTCTACCCTCCTGGTGCACCTCATC2&SAAGGGAGGACACAAGGACATTGGTG 

CTTCAGAGCCTTTGAAGATGAGAAGAGAGTGCAGGAGGGCTGGGGGCCATGGAGGAAAGGCC 

TAAAGTTT CACTTGGGGAC AGAGAGCAGAG CACACT CGGGCCT CATCCCT CC CAAGATGCCA 

GTGAGCCACGTC CATGCC C ATTC CGTGC AAGG CAGATATT CCAGTCATATTAACAGAACACT 

C CTGAGACAGTTGAAGAAGAAATAGCACAAAT CAGGGGTACTCCCTTCACAGCTGATGGTTA 

ACATTCCACCTTCTTTCTAGCCCTTCAAAGATGCTGCCAGTGTTCGCCCTAGAGTTATTACA 

AAGCCAGTGCCAAAACCCAGCCATGGGCTCTTTGCAACCrCCCAGCTGC 

G ACAG C GAGAT G CAAG CAAATG CT CAG CTCT C CTT AC C C TGAAGGG GT CT CC CTGGAAT GGA 

AGTCCCCTGGCATGGTCAGTCCTCAGGCCCAAGACTCAAGTGTGCACAGACCCCTGTGTTCT 

GCGGGTGAACAACTGCCCACTAACCAGACTGGAAAACCCAGAAAGATGGGCCTTCCATGAAT 

GCTTCATTCCAGAGGGACCAGAGGGCCTCCCTGTGCAAGGGATCAAGCATGTCTGGCCTGGG 

TTTTCAAAAAAAGAGGGATCCTCATGACCTGGTGGTCTATGGCCTGGGTCAAGATGAGGGTC 

TTTCAGTGTTCCTGTTTACAACATGTCAAAGCCATTGGTTCAAGGGCGTAATAAATAC 

GTATTCAAAAA 
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FIGURE 48 

MAWSEDDFQHSSNSTyGTTSSSLRADQEALLEKLLDRPPPGLQRPEDRFCGTYIIFFSLGI 
GSLLPWNFFITAKEYWMFKLRNSSSPATG3DPEGSDILNYFESYLAVASTVPSMLCLVANFL 
LVNRVAVHIRVLASLWILAIFMVITALVKVDTSSWTRGFFAVTIVCMVILSGASTVFSSSI 
YGMTGSF PMRNSQAL I SGGAMGGTVS AVAS LVDLAAS SDVRNS ALAFFLTAT I FLVLCMGLY 
LLLSRLEYARYYMRPVLAAHWSGEEELPQDSLSAPSVASRFIDSHTPPLRPILKKTASLGF 
CVTYVFFITSLIYPAVCTNIESLNKGSGSLWTTKFFIPLTTFLLYNFADLCGRQLTAWIQVP 
GPNSKALPGFVLLRTCLIPLFVLCNYQPRVHLKTVVFQSDVYPALLSSLLGLSNGYLSTLAL 
LYGPKIVPRELAEATGWMSFYVCLGLTLGSACSTLLVHLI 

Transmembrane domain: 

amino acids 50-74 (type II), 105-127, 135-153, 163-183, 228-252, 
305-330, 448-472 
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FIGURE 49 

GACAGTGGAGGG CAGTGGAGAGGACCG CGC TG T CCTGCTGT C AC CAAG AGCTGG AGACACCA 

TCTCCCACCGAGAGTC^ISGCCCCATTGGCCCTGCACCTCCTCGTCCTCGTCCCCATCCTCC 

TCAGCCTGGTGGCCTCCCAGGACTGGAAGGCTGAACGCAGCCAAGACCC CTT CGAGAAATGC 

ATGCAGGATCCTGACTATGAGCAGCTGCTCAAGGTGGTGACCTGGGGGCTCAATCGGACCCT 

GAAGCCCCAGAGGGTGATTGTGGTTGGCGCTGGTGTGGCCGGGCTGGTGGCCGCCAAGGTGC 

TCAGCGATGCTGGACACAAGGTCACCATCCTGGAGGCAGATAACAGGATCGGGGGCCGCATC 

TTCACCTACCGGGACCAGAACACGGGCTGGATTGGGGAGCTGGGAGCCATGCGCATGCCCAG 

CTCTCACAGGATCCTCCACAAGCTCTGCCAGGGCCTGGGGCTCAACCTGACCAAGTTCACCC 

AGTACGACAAGAACACGTGGACGGAGGTGCACGAAGTGAAGCTGCGCAACTATGTGGTGGAG 

AAGGTGCCCGAGAAGCTGGGCTACGCCTTGCGTCCCCAGGAAAAGGGCCACTCGCCCGAAGA 

CATCTACCAGATGGCTCTCAACC^GGCCCTCAAAGACCrrCAAGGC^CTGGGCTGCAGAAAGG 

CG ATG AAG AAGTTT GAAAGGCACACGCT CTTGGAAT AT CTTCTCGG GGAGGGGAAC CTGAGC 

CGGCCGGCCGTGCAGCTTCTGGGAGACGTGATGTCCGAGGATGGCTTCTTCTATCTCAGCTT 

CGCCGAGGCCCTCCGGGCCCACAGCTGCCTCAGCGACAGACTCCAGTACAGCCGCATCGTGG 

GTGGCTGGGACCTGCTG C CG CG CGCG CTG CTGAG CT CG CTGT C CGGGCTTGTGC TGTTGAAC 

GCGCCCGTGGTGGCGATGACCCAGGGACCGCACGATGTGCACGTGCAGATCGAGACCTCTCC 

CCCGGCGCGGAATCTGAAGGTGCTGAAGGCCGACGTGGTGCTGCTGACGGCGAGCGGACCGG 

CGGTGAAGCGCATCACCTTCTCGCCGCCGCTGCCCCGCCACATGCAGGAGGCGCTGCGGAGG 

CTGCACTACGTGCCGGCCACCAAGGTGTTCCTAAGCTTCCGCAGGCCCTTCTGGCGCGAGGA 

GCACATTGAAGGCGGCCACTCAAACACCGATCGCCCGTCGCGCATGATTTTCTACCCGCCGC 

CGCGCGAGGGCGCGCTGCTGCTGGCCTCGTACACGTGGTCGGACGCGGCGGCAGCGTTCGCC 

GGCTTGAGCCGGGAAGAGGCGTTGCGCTTGGCGCTCGACGACGTGGCGGCATTGCACGGGCC 

TGTCGTGCGCCAGCTCTGGGACGGCACCGGCGTCGTCAAGCGTTGGGCGGAGGACCAGCACA 

GCCAGGGTGGCTTTGTGGTACAGCCGCCGGCGCTCTGGCAAACCGAAAAGGATGACTGGACG 

GTCCCTTATGGCCGCATCTACTTTGCCGGCGAGCACACCGCCTACCCGCACGGCTGGGTGGA 

GACGGCGGTCAAGTCGGCGCTGCGCGCCGCCATCAAGATCAACAGCCGGAAGGGGCCTGCAT 

CGGACACGGCCAGCCCCGAGGGGCACGCATCTGACATGGAGGGGCAGGGGCATGTGCATGGG 

GTGGCCAGCAGCCCCTCGCATGACCTGGCAAAGGAAGAAGGCAGCCACCCTCCAGTCCAAGG 

CCAGTTAT CTCTCCAAAACACG AC CCACACGAGG AC CTCGCATTAAAGTATTTTCGGAAAAA 

AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 



q<j /X70 
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FIGURE 50 

MAPKMiHLLVLVPILLSLVASQDW^ 

I WGAGVAGLVAAKVLSDAGHKVTILEADNRIGGRI FT YRDQNTGW IGELGAMRMPSSHRI L 

HKLCQGLGLNLTKFTQYDKNTWTEVHEVKLRimA^EKVPEKLGYALRPQSKGHSPEDIYQ^ 

I^QALKDLKALGCRKAMKKFERHTLLEYIiLGEGNLSRPAVQLLGDVMSEDG 

AHSCLSDRLQYSRI VGGWDLLPRALLSSLSGLVLLNAPVVAMTQGPHDVHVQ IETS PPARML 

KVLKADVVLLTASGPAVKRI TFSPPLPRHMQEALRRLHYVPATKVFLSFRRPFWREEHI EGG 

HSNTDRPSRMIFYPPPREGALLIJ^YTWSDAAAAFAGLSREEAIiRLALDDVAALHGPVWQ 

WDGTGWKRWAEDQHSQGGFWQPPALWQTEKDDWTVPYGRIYFAGEHTAYPHGWVETAVKS 

ALRAAIKINSRKGPASDTASPEGHASDMEGQGHVHGVASSPSHDLAXEEGSHPPVQGQLSLQ 
NTTHTRTSH 

Signal peptide: 

amino acids 1-21 
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FIGURE 51

CTGACATGGCCTGACTCGGGACAGCTCAGAGCAGGGCAGAACTGGGGACACTCTGGGCCGGCCTTCTG 

CCTGCA^GACGCTCTGAAGCCACCCTGTCTCTGGAGGAACCACGAGCGAGGGAAGAAGGACAGGGAC 

TCGTGTGGCAGGAAGAACTCAGAGCCGGGAAGCCCCCATTCACTAGAAGCACTGAGAGATGCGGCCCC 

CTCGCAGGGTCTGAATTTCCTGCTGCTGTTCACAAAGATGCTTTTTATCTTTAAC^ 

CACTTCCGACCCCGGCGTTGATCTGCATCCTGACATTTGGAGCTGCCATCTTCTTGTGGCTGATCArc 

AGACCTCAACCCGTCTTACCTCTTCTTGACCTGAACAAT CAGT CTGTGGGAAT TGAGGGAGGAGCACG 

AGGTTTTCCAAAGAGGACTCGCTGTGT CTGACAATGGGC CCTGCTTGGGATATAGAAAACCAAACCAG 
C CCTACAG ATGG CTATCTTACAAACAGGTGTCTGATAGAGCAGAGTACCTGGGTTCCTGT CT CTTGCA 
TAAAGGTTATAAATCATCACCAGAC CAGT TTGTCGGCATCTTTGCTCAGAATAGGC CAGAGTGGATCA 
T CT C CG AATTGGCTTGTT ACACGTACTCZTATGGTAGCTGTACCTCTGTATGACACCTTGGGACCAGAA 
G CCATCGTACATATTGTCAACAAGGCTGATATCGCCATGGTGATCTGTGACACACC CCAAAAGGCAT^ 
GGTGCTGATAGGGAATGTAGAGAAAGGCTTCACCCCGAGCCTGAAGGTGATCATCCTTATGGACCCCT 
TTGATGATGACCTGAAGCAAAGAGGGGAGAAGAGTGGAATTGAGATCTTATCCCTATATGATGCTGAG 
AACCTAGGCAAAGAGCACTTC^GAAAACCTGTGCCTCCTAGCCCAGAAGACCTGAGCGTCATCTGCTT 
CACCAGTGGGACCACAGGTGACCCCAAAGGAGCCATGATAACCCATCAAAATATTGTT^ 
CTGCCTTTCTCAAATGTGTGGAGCATGCTTATGAGC CCACTC CTGATGATGTGGC CATAT CCTACCTC 
CCTCTGGCTC AT ATGTTTGAGAGGATTGTACAGG CTGTTGTGTACAGCTGTGGAG CCAGAGTTGGATT 
CTTCCAAGGGGATATTCGGTTGCTGGCTGACGACATGAAGACTTTC 

TGCCTCGACTCCTTAACaGGATCTACGATAAGGTACAAAATGAGGCCAAGACACCCTTGAAGAAGTTC 
TTGTTGAAGCTGGCTGTTTCCAGTAAATTC^lAAGAGCrTCAAAAGGGTATCATCAGGCATGA 
CTGGGACAAG CTCATCTTTG CAAAGATCCAGGACAGCCTGGGCGGAAGGGTTCGTGTAATTGTCACTG 
GAGCTGC C CCCATGTCCACTTCAGTCATGACATT CTTCCGGGCAGCAATGGGATGTCAGGTGTATGAA 
GCTTATGGTCAAACAGAATGCACAGGTGGCTGTACATTT 

CGTTGGGGTGCCCCTGGCTTGCAATTACGTGAAGCTGGAAGATGTGGCTGACATGAACTACTTTAC^ 
TGAATAATGAAGGAGAGGT CTGCATCAAGGGTACAAACGTGTTCAAAGGATAC CTGAAGGACC CTGAG 
AAGACACAGGAAGCCCTGGACAGTGATGGCTGGCTTCACACAGGAGACATTGGTCGCTGGCTCCCGAA 
TGGAACTCTGAAGATCAT CGACCGTAAAAAGAACATTTTCAAGCTGGCC CAAGGAGAATACATTGCAC 
C AGAGAAG AT AG AAAATATCT ACAACAGGAGT C AAC CAGTGTT AGAAATTTTTGT ACACG GGGAG AG C 
TTACGGTCATCCTTAGTAGGAGTGGTGGTTCCTGACACAGATGTACTTCCCTCATTTGCAGC 
TGGGGTGAAGGG CT CCITTGAGGAACTGTGCCAAAACCAAGTTGTAAGGGAA 

TGCAGAAAATTGGGAAAGAAAGTGGCCTT AAAACTTTTGAACAGGTCAAAG CCATTTTT CTTCATCCA 

GAG C CATT TT C CATTGAAAATGGGC TC TTG ACAC CAACATTGAAAGCAAAGCGAGGAG AGCT TT C CAA 

AT ACTTT CGGACC CAAATTG ACAG C C TG T ATG AG CACAT C CAGGATTAGG AT AAGGTAC TTAAGTAC C 

TGCCGGCCCACTGTGCACTGCTTCTGAGAAAATGGATTAAAAACT 

C CT C CTATTTTTTTTT AACCT GTTAAACT CT AAAG CCATAGC TTTTGTTT^ 

GTGTAAACTTAGTTCCCAAATAAATC^TCCTGTCTTTCCCATCTTCGATGTTGCT 

TCAC^CTACTTTTATCAACATGCCTGT^ 

TTTCCAACCTTAATACTATTAGTAACCACAAGTTCAAGG<3TCAAAGG^ 
TGTTITGTGATAAACATAACTTGCCAAGA.GTCTCTATGCTTATTTAC^ 
GAGATTTTTAAATTCTGAAAAACTGCTTACAATTCATGTT 
TTTAGTTTTAGCCTATCACTCATGTCAATCATATCTATGAGACAAATGTCT 

AAATT AAATTG TGTACTGAAGGGAAAAGTTTG ATCATAC CAAAC ATTT C CT AAACTCTCTAGT T AGAT 
ATCTGACTTGGGAGTATTAAAAATTGGGTCTATGACATACTGTCCAAAAGGAATGCTGTTCTTAAAGC 
ATTATTTACAGTAGGAACTGGGGAGTAAATCTGTTCCCTAC^GTTTGCTGCTGAGCTGGAAGCTGTGG 
GGGAAGGAGTTGACAGGTGGGCCCAGTGAACTTTTCC^GTAAATGAAGCAAGCACTGAATAAAAACCT 
CCTGAAC TGGGAACAAAGATCTAC AGGC AAGCAAGATGCC CACACAACAGG CTTATTTTCTGTGAAGG 
AAC CAACTGATCTCCCC CACCCTTGGATTAG AGTTCCTGCTCTACCTTAC CCACAGATAAC ACATGTT 
GTTTCTAC TT GT AAATGT AAAGT CTTT AAAATAAACT ATT ACAGATAAAAAA 



t 
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FIGURE 52 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA60775
<subunit 1 of 1, 739 aa, 1 stop 
<MW: 82263, pi: 7.55, NX(S/T): 3

MDALKPPCLWRNHERGKKDRDSCGRKNSEPGSPHSLEALRDAAPSQGLNFLLLFTKMLFIFN 
FLFS PLPTPAL I CILTFGAAI FLWL I TRPQPVLPLLDLNNQS VGIEGGARKGVSQKNNDLTS 
CCFSDAKTMYEVFQRGLAVSDNGPCLGYRKPNQPYRWLSYKQVSDRAEYLGSCLLHKGYKSS 
PDQF VGI FAQNRPEWI I S ELACYTYSMVAVPLYDTLGPEAI VHI VNKAD IAMVI CDTPQKAL 
VLIGNVEKGFTPSLKVIILMDPFDDDLKQRGEKSGIEILSLYDAENLGKEHFRKPVPPSPED 
LSVICFTSGTTGDPKGAMITHQNIVSNAAAFLKCVEHAYEPTPDDVAISYLPLAHMFERIVQ 
AVVYSCGARVGFFQGDIRLLADDMKTLKPTLFPAVP^ 

VSSKFKELQKGIIRHDSFWDKLIFAKIQDSLGGRVRVIVTGAAPMSTSVMTFFRAAMGCQVY 
EAYGQTE CTGGCTFTL PGDWT S GHVG VP LACNYVKLED VADMNY FTVNNEGE VC I KGTNVF K 
GYLKDPEKTQEALDSDGWLHTGDIGRWLPNGTLKIIDRKKNIFKLAQGEYIAPEKIENIYNR 
SQPVLQIFVHGESLRSSLVGVWPDTDVLPSFAAKLGVKGSFEELCQNQWREAILEDLQKI 
GKESGLKTFEQVKAIFLHPEPFSIENGLLTPTLKAKRGELSKYFRTQIDSLYEHIQD 

Important features: 

Type II transmembrane domain:

amino acids 61-80 

Putative AMP-binding domain signature. 

amino acids 314-325 

N-glycosylation site. 

amino acids 102-105, 588-591 and 619-622 
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FIGURE 53 

GGAGGCGGAGGCCGCGGCGAGCCGGGCCGAGCAGTGAGGGCCCTAGCGGGGCCCGAGCGGGG 
CCCGGGGCCCCTAAGCCATTCCTGAAGTCATGGGCTGGCCAGGACATTGGTGACCCGCCAAT 
CCGGTATGGACGACTGGAAGCCCAGCCCCCTCATCAAGCCCTTTGGGGCTCGGAAGAAGCGG 
AGCTGGTACCTTACCTGGAAGTATAAACTGACAAACCAGCGGGCCCTGCGGAGATTCTGTCA 
GACAGGGGCCGTGCTTTT CCTGCT GGTGAC TGTC ATTGT CAATATCAAGTTGAT CCTGGACA 
CTCGGCGAGCCATCAGTGAAGCCAATGAAGACCCAGAGCCAGAGCAAGACTATGATGAGGCC 
CTAGGC CGC CTGGAGC CC C CACGGCG CAGAGG CAGTGGTC CC CG GC GGGT C CTGGACGTAGA 
GGTGTATT CAAGTCGCAGCAAAGTATATGTGGCAGTGGATGG CACCACGGTGCTGGAGGATG 
AGGCCCGGGAGCAGGGCCGGGGCATCCATGTCATTGTCCTCAACCAGGCCACGGGCCACGTG 
ATGGCAAAACGTGTGTTTGACACGTACTCACCTCATGAGGATGAGGCCATGGTGCTATTCCT 
CAACATGGTAGCGCCCGGCCGAGTGCTCArCTGCACTGTCAAGGATGAGGGCTCCTTCCACC 
TCAAGGACACAGCCAAGGCTCTGCTGAGGAGCCTGGGCAGCCAGGCTGGCCCTGCCCTGGGC 
TGGAGGGACACATGGGCCTTCGTGGGACGAAAAGGAGGTCCTGTCTTCGGGGAGAAACATTC 
TAAGTCACCTGCCCTCTCTTCCTGGGGGGACCCAGTCCTGCTGAAGACAGATGTGCCATTGA 
G CT CAG CAGAAG AGGC AG AGTGCCACT GGGCAGACACAGAGCTGAACCGTCG C CGC CGGCGC 
TTCTGCAGC^AAGTTGAGGGCTATGGAAGTGTATGCAGCTGCAAGGACCCCACACCCATCGA 
GTTCAGCCCTGACCCACTCCCAGACAACAAGGTCCTCAATGTGCCTGTGGCTGTCATTGCAG 
GGAACCGACCCAATTACCTGTACAGGATGCTGCGCTCTCTGCTTTCAGCCCAGGGGGTGTCT 
CCTCAGATGATAACAGTTTTCATTGACGGCTACTATGAGGAACCCATGGATGTGGTGGCACT 
GTTTGGTCTGAGGGGCATC CAG CATACT CC CATCAGCAT CAAGAATGC CCGCGTGT CT CAGC 
ACTAC^VGGCCAGCCTCACTGCCACTTTCAACCTGTTTCCGGAGGCCAAGTTTGCTGTGGTT 
CTGGAAGAGGACCTGGACATTGCTGTGGATTTTTTC^GTTTCCTGAGCCAATCC^TCC^CCr 
ACTGGAGGAGGATGACAGCCTGTACTGCATCTCTGCCTGGAATGACCAGGGGTATGAACACA 
CGGCTGAGGACCCAGCACTACTGTACCGTGTGGAGACCATGCCTGGGCTGGGCTGGGTGCTC 
AGGAGGTCCTTGTACAAGGAGGAGCTTGAGCCCAAGTGGCCTACACCGGAAAAGCTCTGGGA 
TTGGGACATGTGGATGCGGATGCCTGAACAACGCCGGGGCCGAGAGTGCATCATCCCTGACG 
TTTCCCGATCCTACCACTTTGGC^TCGTCGGCCTCAACATGAATGGCrACTTTCACGAGGCC 
TACTTCAAGAAGGACAAGTTCAACACGGTTCCAGGTGTCCAGCTCAGGAATGTGGACAGTCr 
GAAG AAAG AAGCTTATGAAGTGGAAGTT CACAGGCTGCT CAGTGAGGCTGAGGTT CTGGAC C 
ACAGCAAGAACCCTTGTGAAGACTCTTTCCTGCCAGACACAGAGGGCCACACCTACGTGGCC 
TTTATTCG AATGGAGAAAGATGATGACTT CAC CACCTGGACCCAGCTTGC CAAGTG CCTCCA 
TATCTGGGACCTGGATGTGCGTGGCAACCATCGGGGCCTGTGGAGATTGTTTCGGAAGAAGA 
ACCACTTCCTGGTGGTGGGGGTCCCGGCTTCCCCCTACTCAGTGAAGAAGCCACCCTCAGTC 
ACCC CAATTTTCCTGGAGCCAC C CCCAAAGGAGGAGGGAGC CCCAGGAG CCC CAGAACAGAC 
ATGAGACCTC CT C CAGGACC CTGCGGGGCTGGGT ACTGTGT ACCCCCAGG CTGGCTAGCC CT 
TCCCTCCATCCTGTAGGATTTTGTAGATGCTGGTAGGGGCTGGGGCTACCTTGTTTTTAACA 
TGAGACTTAATTACTAACTCCAAGGGGAGGGTTC CC CTGCTCCAACACCCCGTT CCTGAGTT 
AAAAGT CTATTTATTTACTT CCTTGTTGGAGAAGGGCAGGAGAGTACCTGGGAAT CATT ACG 
ATCCCTAGCAGCTCATCCTGCCCTTTGAATACCCTCACTTTCCAGGCCTGGCTCAGAATCTA 
ACCTATTTATTGACTGTCCTGAGGGCCTTGAAAACAGGCCGAACCTGGAGGGCCTGGATTTC 
TTTTTGGGCTGGAATGCTGCCCTGAGGGTGGGGCTGGCTCTTACTCAGGAAACTGCTGTG.ee 
CAACCCATGGACAGGCCCAGCTGGGGCCCACATGCTGACACAGACTCACTCAGAGACCCTTA 
GACACTGGACCAGGCCTCCTCTCAGCCTTCTCTTTGTCCAGATTTCCAAAGCTGGATAAGTT 
GGTCATTGATTAAAAAAGGAGAAGCCCTCTGGGAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 54 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA61185
><subunit 1 of 1, 660 aa, 1 stop
><MW: 75220, pI: 6.76, NX(S/T): 0

MDDWKPSPLIKPFGARKKRSWYLTWKYKLTNQRALRRFCQTGAVLFLLVTVIVNIKLILDTO 
RAISEANEDPEPEQDYDEALGRLEPPRRRGSGPRRVLDVEVYSSRSKVWAVDGTTVLEDEA 
REQGRGIHVIVLNQATGHVMAKRVFDTYSPHEDEAMVLFLNMVAPGRVLICTVKDEGSFHLK 
DTAKALLRSLGSQAGPALGWRDTWAFVGRKGGPVFGEKHSKSPALSSWGDPVLLKTDVPLSS 
AEEAECHWADTELNRRRRRFCSKVEGYGSVCSCKDPTPIEFSPDPLPDNKVLNVPVAVIAGN 
RPNYLYRMLRSLLSAQGVS PQMITVFTDGYYEEPMDWALFGLRG IQHTP I S I KNARVSQHY 
KASLTATFNLFPEAKFAVVLEEDLDIAVDFFSFLSQSIHLLEEDDSLYCISAWNDQGYEHTA 
EDPALLYRVETMPGLGWLRRSLYKEELEPKWPTPEKLWDWDMWMRMPEQRRGRECIIPDVS 
RSYHFGIVGLNMNGYFHEAYFKKHKFNTVPGVQLRNVDSLKK 

knpcedsflpdteghtyvafirmekdddft™tqlakclhiwdldvrgnhrglwrlfrkknh 
flwgvpaspysvkkppsvtpi flepppkeegapgapeqt 

Important features of the protein: 
Transmembrane domain: 

amino acids 38-55 

Homologous region to Mouse GNT1 

amino acids 229-660 
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FIGURE 55

CGGACGCGTGGGCTGCTGGTGGGAAGGCCTAAAGAACTGGAAAGCCCACTCTCTTGGAA^ 
CTGTTTAAAGAACCTAAGCACCATTT^ 

AAGGAGGG CAGAATGGATGATTTCAT CTCCATTAG CCTGCT GTCTCTGGCTATGTTGGTGGGATGTTA 

CGTGG CCGGAATCAT TC C CTTGG CTGTTAATTTCTCAGAGGAACGACTGAAGCTGGTGACTGTTTTGG 

GTGCTGG C CTTCTCTGTGGAACTGCT CTGG CAGTCATCGTGCCTGAAGGAGTACATGCC CTTTATGAA 

GATATTCTTGAGGGAAAACACCACCAAGCAAGTGAAACACATAATGTGATTGCATCAGAC 

AG AAAAATCAGTTGTCCATGAACATGAGCACAG C CACGACCACACACAG CTGCATGCCTATATTGGTG 

TTTCCCTCGTTCTGGGCTTCGTTTTCATGTTGCTGGTGGACCAGATTGGTAACTCCCATG 

ACT G ACGAT C CAG AAG C AGCAAGGT CT AG CAATT CC AAAAT CAC CAC CACG C TGGGTCT GGTT GT C CA 

TGCTGCAGCTGATGGTGTTGCTTTGGGAGCAGCAGCATCTAOT 

TGTTTGTGGCAATCATGCTACATAAGGCACCAGCTGCTTTTGGACTGGTTTCCTTCT^ 

GG CTT AG AG C G G AAT CGAAT CAG AAAG CACTTGC TG GT CTTTGCATTGGCAG CAC CAGTTATGT C CAT 

GGTGACATACTTAGGACTGAGTAAC^GCAGTAAAGAAGCCCTTTCAGAGGTGAACGCCACGGGAGTGG 

CCATGCTTTT ^TCTGCC GGG ACATTT CTTTATG TTGCCACAGTACATGTCCTCC CTGAGGTGGGCGGA 

AT AGGG CACAGCCACAAGCCCGATGCC ACGGGAGGGAGAGG CCTCAG CCGC CTGGAAGTGGCAGC CCT 

GGTTCTGGGTTGCCTGATCCCTCTCATCCTGTCAGTAGGACACCAGCATTAAATGT 

CTTGGT CCAGGGCCGTTTGC CAT C CAGTG AGAACAGCCGGCACGTGACAGCTACT CACTTCCTCAGTC 

T CTTGTCT ^ c ^ T GCGClATCTCTACATGTATTCCrAGAGTC CAGAGGGGAGGTGAGGTTAAAACCTG 

AGTAATGGAAAAGCTTTTAGAGTAGAAACACATTTACGTTGCAGTTAGCTATAGACATCCCATTGTGT 

TATCTTTTAAAAGGCCCTTGACATTTTGCGTTTTAATATTTCTCTTAACCCTATTCTCAGGGA 

GAATTT AGTTTTAAGGAAAAG AGGAGAA CTT CATACT CACAATGAAAT AGTG AT T AT G AAAATACAGT 

GTTCTGTAATTAAGCTATGTCTCTTTCTTCTTAGTTTAGAG^ 

AACATGGTTCCCACCATGTAAGACTGGTC 

GCACCCACTCACTTAGATGCTAAAGGTGATTCTTAGTTAATCTGGGATTAGGGT^ 

AAGAC ACATTGAAAGC T CTCTT T AT A CT CAAAAGAGATATCCATTG AAAAGGGATGT CTAGAGGGATT 

TAAACAGCTCCTTTGGCACGTGCCTCTCTGAAT^ 

ACCT GT CT CCAC ATTC CT AG AG AGGAGCCAAGTT CTAGTAGTTT CAGTT CT AGG CTTTC CTT CAAGAA 
C AGTCAGAT CACAAAGTGT C TTTGG AAATT AAGGGAT AT T AAATTTTAAG TG ATTT TT GG ATGGTTAT 
TGATATCTTTGTAGTAGCTTTTTTTAAAAGACTACCAAAATGTATGGTTGTC 

TT TT TT TT TAAT TATTT CT C TTAGCAGAT CAGCAATC C CT CTAGG GAC CT AAATACTAGG T CAG CTTT 
GGCGACACTGTGTCTTTCTCACATAACCACCTGTAG 

TTGATTTAAAGCTTATTGGAAT CATGTCTCTTGT CTCTTCGTCTTTTCTTTGCTTT^CTTCTAACTTT 
TCCCTCTAGCC TCTCCTCGC ^CAATTTGCTGCTTACTG CTGGTGTTAATATITGTGTGGGATGAATT 
CTTATCAGGACAACCACTTCTCGAACTGTAATAATGAAGATAATAATATCTTTATTCTTTATCCCCTT 
C AAAG AAATT AC CTT T GTGT C AAATG C CGCTTTGT TGAGCC CTT AAAAT AC CAC CT C CTCATGT GT AA 

ATTTTTTTTTCATATTTGCCAAAATTTTTGTAAACCCTGTCTTGTCAAATAAGTGT^ 
TATTAATTTATTTTTACTTTCTATACCATTTCAAAACACATTA^ 

T CTT CAGGG CAGTGGAC GTAGTAGTTT GT AAAAAC G TT TT CT ATGA CG CAT AAG CT AG CATG C CT ATG 

AT TT AT TTCC TTCATG AATTTGTCACTGGATCAGCAGCTGTGGAAATAAAGCTTGTGAGC CCTCTGCT 

GGCCACAGTGAGGAAAGTAGCACAAATAGGATACAGTTGTATGTAGT<^TTGGCAACAATTC 

AT TTT ACTAC CAAG AGAAGG T AT AGT AT GG AAAG TC CAAATG ACTT C CTTGATTGGAT GTTAACAG CT 

GACTGGTGTGAGACTTGAGGTTTGATCTAGTCCTTCAAA 

AACTGACTTTGTCAAATAAATAGCAGATTGTAGTGTCAAAAAAAA 
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FIGURE 56 

MDDF IS I SLLSLAMLVGCYVAG 1 1 PLAVNFSEERLKLVTVLGAGLLCGTALAVI VPEGVHAL 
YEDILEGKHHQASETHNVIASDKAAEKSVVHEHEHSHDHTQLHAYIGVSLVLGFVFMLLVDQ 
IGNSHVHSTDDPEAARS SNS KI TTTLGLVVHAAADGVALGAAAS TSQTSVQL I VFVAIMLHK 
APAAFGLVSFLMHAGLERNRIRKHLLVPALAAPVMSMVTYLGLS KS SKEALSEVNATGYAML 
FSAGTFLYVATVHVLPEVGGIGHSHKPDATGGRGLSRLEVAALVLGCLIPLILSVGHQH 

Signal peptide: 

amino acids 1-18 

Transmembrane domain: 

amino acids 37-56, 106-122, 211-230, 240-260, 288-304 
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FIGURE 57 

GCTCGAGGCCGGCGGCGGCGGGAGAGCGACCCGGGCGGCCTCGTAGCGGGGCCCCGGATCCC 
CG AGTGGCGGCCGGAGC CTCGAAAAGAGATTCT CAGC G CTGATT TTGAGATGATGG GCTTGG 
GAAACGGGCGTCGCAGCATGAAGTCGCCGCCCCTCGTGCTGGCCGCCCTGGTGGCCTGCATC 
ATCGTCTTGGGCTTCAACTACTGGATTGCGAGCTCCCGGAGCGTGGACCTCCAGACACGGAT 
CATGGAGCTGGAAGGCAG GGT C CG CAGGGCGG CT G CAG AG AGAGG CGC CGTGGAGCTGAAGA 
AGAACGAGTT CC AGGGAGAG CTGGAGAAGCAG CGGGAGCAGC TTGACAAAATCCAGTCC AGC 
CACAACTT CCAG CTGGAGAG CGTCAACAAGCTGT ACCAGGACGAAAAGG CGGTTTTGGT GAA 
TAACATCACCAC AG G TGAGAGG CTCATC CG AGT GCTGCAAGACCAGTTAAAGACCCTGCAGA 
GGAATTAC GG CAGG CTGC AG CAGGATGT CCTCCAGTTT CAGAAGAAC CAGACCAACCTGG AG 
AGGAAGTTCTCCTACGACCTGAGCCAGTGCATCAATCAGATGAAGGAGGTGAAGGAACAGTG 
T GAG GAG CGAAT AG AAGAGGT CACC AAAAAGGGGAATGAAG CTGTAGCTT C CAGAGAC CTGA 
GTGAAAACAACGACCAGAGACAGCAGCT CCAAG C C C T CAGTG AG CCTCAGCC CAGGCTGCAG 
GCAGCAGG CCTGC CACACACAGAGGTGCCACAAGGGAAGGGAAACGTGCTTGGTAACAGCAA 
GTC CCAGACACCAGC CCCCAGTTC CGAAGTGGTTTTGGATT C AAAGAGACAAG TTGAG AAAG 
AGGAAACCAATGAGATCCAGGTGGTGAATGAGGAGC CT CAGAGGGACAGG CTGCCG CAGGAG 
C CAGG CCGGGAG CAGGTGGTGG AAGACAGACCTGTAGGTGGAAGAGGCTT CGGGGGAGCCGG 
AGAACT GGGC CAGACC CC ACAGGTGCAGGCTG C C CTGT CAGT GAGCCAGGAAAATCCAGAGA 
TGGAGGGC CCTGAGCGAGACCAGCTTGTCATCC CCGACGGACAGGAGGAGGAGCAGGAAGCT 
GCCGGGGAAGGGAGAAACCAGCAGAAACTGAGAGGAGAAGATGACTACAACATGGATGAAAA 
TGAAGCAGAATCTGAGACAGACAAGCAAGCAGCCCTGGC^GGGAATGACAGAAACATAGATG 
TT TTTAATGTTGAAGATC AGAAAAGAGACACCATAAATTTACTTGAT CAG CGTG AAAAGCGG 
AATCATACACTCTGAATTGAACTGGAATCACATATTTCACAACAGGGCCGAAGAGATGACTA 
TAAAATGTTCATGAGGGACTGAATACTGAAAACTGTGAAATGTACTAAATAAAATGT^ 
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FIGURE 58 

MMGLGNGRRSMKS P PLVLAALVAC 1 I VLGFNYWI ASSRS VDLQTR IMELEGRVRRAAAERGA 
VELKKNEFQGE^KQREQLDKIQSSHNFQLESVNKLYQDEKAVLVNNITTGERLIRVLQDQL 
KTLQRNYGRLQQDVLQFQKNQTNLERKFSYDLSQCINQMKEVKEQCEERIEEVTKKGNEAVA 
SRDLSENNDQRQQLQALSEPQPRLQAAGLPHTEVPQGKGNVLGNSKSQTPAPSSEWLDSKR 
QVEKEETNEIQWNEEPQRDRLPQEPGREQWEDRPVGGRGFGGAGELGQTPQVQAALSVSQ 
ENPEMEGPERDQLVIPDGQEEEQEAAGEGRNQQKLRGEDDYNMDENEAESETDKQAALAGND 
RNIDVFNVEDQKRDTINLLDQREKRNHTL 

Signal peptide: 

amino acids 1-29 
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FIGURE 59 

aSATGCAGAAAGCCTCAGTGTTC^ 
CCAGTGGCTTCCTGCTCACCOSTTTGGAGCTCA^^ 

TAGATGCTCTGCGATTTGACTT CGCC CAGCCCCAGCATTCACACGTGC CTAGAGAGCCTC CTGTCTCCCTACCCT 

TCCTGGGCAAACTAAGCTCCTTGCAGAGGATCCTGGAGATTCAGCCCCACCATGCCCGGCTCTACCGATCTCAGG 

TTGACCCTCCTACC^CCACCATGCAGCGCCTCAAGGCCCTCACCACTGGCTCACTGCCTACCTTTA 

GTAGTAACTTCGCCAGCCACGCCATAGTGGAAGACAATCTCATTAAGCAGCTCACCAGTGCAQ 

TCTTCATGGGAGATGATACCTGGAAAGACCTTTTCCCTGGTGCTTTCTCCAAAGCTTTCTTCT^ 

ATGTCAGAGACCTAGACACAGTGGACAATGGCATCCTGGAACACCTCTACCCCACC^ 

ACGTGCTOATTGCTCACTTCCTGGGTGTGGACCACTCT 

AGAAACTTAGCCAGATGGACCAGGTGATCCAGGGACT 

CTGGGGACCATGGGATGACCACAAATGGAGACCATGGAGGGGACAGTGAGCTGGAGGTCTCAGCTGCT 

TGTATAGCCCCACAGCAGTCTTCCCCAGCACCCCACCAGAGGAGCCAGAGGTGATTCCT^^ 

CCACGCTGGCCCTGCTGCTGGGCCTGCCCATCCCATTTGGGAATATCGGGGAAGTGATGGCTGAGCTATTCTC^ 

GGGGTGAGGACTCCCAGCCCCACTCCTCTGCTTTAGCCCAAGCCrrCAGCTCTC^ 

CCCGATTTCTTCATACCTACTCAGCTGCTACTCAGGAC 

TCTCCAAGGCCTCTGCTGACTACCAGTGGCTTCTCCAGAGCCCCAAGGGGGCTGAGGCGACACTC 

TTGCTGAGCTGCAGCAGTTCCTGCGGGGAGCTCGG3CCATGTGCATCGAGTCTTGGGCTCGTTTCTCTCTG 

GCATGGCGGGGGGTACTGCTCTCTTGGCTGCTTCCTCCTTTATCTGCCTGCTGGCATCTCAGTGGGC^VATATCCC 

CAGGCTTTCCATTCTGCCCTCTACTCCTGAC^CCTGTGGCCTGGGGCCTGGTTGGGGCCATAGCGTATGCTGGA 

TCCTGGGAACTATTGAGCTGAAGCTAGATCTAGTGCTTCTAGGGGCT 

rrCTGTGGAAAGCCTGGGCTGGCTGGGGGTCCAAGAGGCCCCTGGCAACCCTGTTTCCCATCCCTGGGCCCGTCC 

TGTTACTCCTGCTGTTTCGCTTGGCTGTGTTCTTCTCTGATAGTTTTGTTGTAGCTGAGGCCAGGGCCACCCCCT 

TCCTTTTGGGCTCATTCATCCTGCTCCTGGTTGTCCAGCTTCACTGGGAGGGCCAGCTGCTTCCAGCTAA 

TCACAATGCCCCGCCTTG^CACTTCAGCCACAACAAACCCCCCACGGCACAATGGTG 

GAATTGGGTTGCTTTTATGTACAAGGCTAGCTGGGCTTTTTCAT 

CCTCTCCCTGGCTGAGTCCTCTGGCATCCATGGTGGGTGGTCGAGCCAAGAATTTATGGTATGGAGCTTGTGTGG 

CGGCGCTGGTGGCCCTGTTAGCTGCCGTGCGCTTGTGGCTTa3CCWCT^ 

CCATGCTCTTTGTGCGCTGGGGACTGCCCCTAATG^ 

CAGATGAGGCTCCCCCCCGTCTCCGGGTCCTGGTCTCTGGGGCATCCATGGTGCTGCC^ 
TGGCTGCTTCAGGGCTCGCGCTGCTGCTCT^ 

GGACCAGGACTGTCCTCACTCCCTTCTCAGGCCCCCCCACTTCTCAAGC^^ 

TCTACCGACACATGCAGGAGGAGTTCCGGG^KXIGGTTAGAGAGGACCAAATCT 

CTTATCAGTTGGGGAGTGTCTACTCAGCTGCTATGGTCACAGCCCTCACCCTGTTG^ 

TGCATGCGGAGCGCATCAGCCTTGTGTTCCTGCTTCTGTTTCTGCAGAGCTTCCTTCTCCTACATCT 

CTGGGATACCCGTCACCACCCCTGGTCCTTTTACT 

CAC^^CCTTCTACTCCACAGGCCACCAGCCTC^ 

C^GAGGGTCATGGCTCCTGTACTTGGCTGCCTGCTTTGCTAGTGGGAGCCAACACCTTTGCCTCCCACCTCCTCT 
TTGCAGT AGGTTGCCCACTGCTCCTGCTCTGGCCTTTCCTGTGTGAGAGTCAAGGGCTC 
CCCCAGGGAATGAAGCTGATGCCAGAGTCAGACCCGAGGAGGAAGAGGAGCGACTGATGGAGATGCGGCT 
ATGCGCCTCAGCACTTCTATGCAGCACTGCTGCAGCTGGGCCTCAAGTACCTCTT^ 

TTGAGGCTGTGGGCTTCATTGTGAGCAGCGTGGGACTTCTCCTGGGCATAGCTTT^ 

CTG TGAG CT C C TGGTTC AGG CAG CTATTTCTGGC C CAGCAGAGGTAGCCTAGT CTGTG ATTACTGGCACTTGGCT 
ACAGAGAGTGCTGGAGAACAGTGTAGCCTGGCCTGTACAGGTA^ 

TCTTACTATCATGCAGCCAGGGGCCGCTGACATCTAGGACTTCATTATTCTATAATTCAGGACCACAGTGGAGTA 

TGAT CCCTAACTCCTGATTTGGATGCATCIX3AGGGACAAGGGGGGCGGTCT CCGG 

GCGTGGTGACTTGGACCTATAATCCCAGCACTTTGGGAGGCAGAGGTGGGAGGATTC 

AGAC CAGC CTGTGGAACATAACAAGACCCCGT CTCTAC TATTT AAAAAAAAGTG TAATAAAATGAT AATAT 
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FIGURE 60

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA62809 
<subunit 1 of 1, 1089 aa, 1 stop 
<MW: 118699, pi: 8.49, NX(S/T): 2 

MQKASVLLFLAWVCFLFYAGIALFTSGFLLTRLELTNHSSCQEPPGPGSLPWGSQGKPGACW 
MASRFSRWLVLIDALRFDFAQPQHSHVPREPPVSLPFLGKLSSLQRILEIQPHHARLYRSQ 
VD P PTTTMQRLKALTT GS LPTF I D AGS NFASHAI VEDNL I KQLTS AGRR WFMGD DTWKD L F 

PGAFSKAFFFPSFNVRDI^TVDNGILEHLYPTMDSGEWDVLIAHFLGVDHCGHKHGPHHPEM 
AKKLSQMDQVIQGLVERLENDTLLWAGDHGMTTNGDHGGDSELEVSAALFLYSPTAVFPST 
PPEEPEVI PQVSLVPTLALLLGLP I PFGKIGEVMAELFSGGEDSQPHSSALAQASALHLNAQ 
QVSRFLHTYSAATQDLQAKELHQLQNLFSKASADYQWLLQSPKGAEATLPTVIAELQOFLRG 
ARAMCIESWARFSLVRMAGGTALLAASCFICLLASQWAISPGFPFCPLIJjTPVAWGLVGAIA 
Y * G ^ GTIELK ^ L ^ GAV ^ 

WFSDSFWAEARATPFLLGSFILLLWQLHWEGQLLPPKLLTMPRLGTSATTNPPRHNGAY 
ALRLG I GLLL CTRLAGLFHRCPEETPVCHS S PWLS PLAS MVGGRAKNLWYGACVAALVAL LA 

™^ RRYG ^^ PEPPML ^^ 

RAVAGLAASGLALLLWKPVTVLVKAGAGAPRTRTVLTPFSGPPTSQADLDYWPQIYRHMOE 
EFR^RLERTKSQGPLTVAAYQLGSWSAAMVTALTLI^PI^LLHAERISLVFLLLFLQSFL 
m^^GIPVTTPGPFTVPWQAVSAWALMATQTFYSTGHQPVFPAIHWHAAFVGFPEGHGS 
^ P ^Y GANTFASmL ^^^ 

FIVSSVGLLLGIALVMRVDGAVSSWFRQLFLAQQR 

Important features : 
Signal peptide: 

amino acids 1-16 

Transmembrane domains: 

amino acids 317-341, 451-470, 481-500, 510-527, 538-555, 831-850, 
1016-1034, 1052-1070 



Leucine zipper pattern. 

amino acids 843-864 

N-glycosylation sites. 

amino acids 37-40, 268-271 



Co /Z-70 
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FIGURE 61 

TGCCGCTGCCGCCGCTGCTGCTGTTGCTCCTTCCGGCGCCTTGGGGACGGGCAGTTCCCTGT 
GTCTCTGGTGGTTTGCCTAAACCTGCAAACATCACCTTCTTATCCATCAACATGAAGAATGT 
CCTACAATGGACT C CACCAGAGGGT CTTCAAGGAGTTAAAGT TACTTACACTGTGC AGTATT 
TCATCACAAATTGGCCCACCAGAGGTGGCACTGACTACAGATGAGAAGTCCATTTCTGTTGT 
CCTGACAG CTCCAGAGAAGTGGAAGAGAAAT C CAGAAGAC CTTC C TGTTT C CATG CAACAAA 
TATACTCCAAT CTGAAGTAT AACGTGTCTGTGTTGAAT ACTAAAT CAAACAGAACGTGGT CC 
CAGTGTGTGACCAACCACACGCTGGTGCTCACCTGGCTGGAGCCGAACACTCTTTACTGCGT 
ACACGTGGAGTCCTTCGTCCCAGGGCCCCCTCGCCGTGCTCAGCCTTCTGAGAAGCAGTGTG 
CC AG GACT TTGAAAGATCAATC AT CAGAGTT CAAGGCTAAAAT CATCTTCTGGTAT GTTT TG 

CCCATATCTATTACCGTGTTTCTTTTTTCTGTGATGGGCTATTCCATCTACCGATATATCCA 
CGTT GG CAAAGAGAAACACC CAG CAAATTTGATTTTGATTTATGGAAATGAATTTGAC AAAA 
GATT CTTT GTG C CTGCTGAAAAAAT CGTGATTAACTTT AT CACC CT CAATATCT CGGATGAT 
TCTAAAAT TTCT CATCAGGATATGAGTTTACTGGGAAAAAG CAGTGATGTAT C CAG CCTTAA 
TGATCCTCAGC CCAGCGGGAACCTGAGG C CCC CT CAGGAGGAAGAGG AGGT G AAACATTTAG 
GGTATG CTTCG CATTTGATGGAAATTTTTTGTGACT CTGAAG AAAACACGGAAG GTACTT CT 
CT CACCCAGCAAGAGT C C CTCAGCAG AACAAT AC CCCCGG AT AAAACAGT CATTGAATATGA 
ATATGATGTCAGAACCACTGACATTTGTGCGGGGCCTGAAGAGCAGGAGCTCAGTTTGCAGG 
AGGAGGTGTCCACACAAGGAACATTATTGGAGTCGCAGGCAGCGTTGGCAGTCTTGGGCCCG 
CAAACGTTACAGTACT CATACA C CCCTCAG CT CCAAGACTTAGACC CC CTGGCGCAGGAG C A 

CACAGACTCGGAGGAGGGGCCGGAGGAAGAGCCATCGACGACCCTGGTCGACTGGGATCCCC 
AAACTGGCAGGCTGTGTATTCCTTCGCTGTCCAGCTTCGACCAGGATTCAGAGGGCTGCGAG 
CC TTCTGAGGGGGATGGGCT CGGAGAGGAGGGTCTTCTAT CTAGAC TCTATG AGGAG CCGG C 
T C CAGA CAGGCCACCAGGAGAAAATGAAAC CT AT CTCATG CAAT TCATGGAGGAATGGGGGT 
TATATGTGCAGATGGAAAACT^TGCCAACACTTCCTTTTGCCTTTTGTTTCCTGTGCAAAC 
AAGTGAGTCACCCCTTTGATCCCAGCCATAAAGTACCTGGGATGAAAGAAGTTTTTTCCAGT 
TTGTCAGTGTCTGTGAGAATTACTTATTTCTTTTCTCTATTCTCATAGCACGTGTGTGATTG 
GTTCATGCATGTAGGTCTCTTAACAATGATGGTGGGCCTCTGGAGTCCAGGGGCTGGCCGGT 

TGTTCTATGCAGAGAAAGCAGTCAATAAATGTTTGCCAGACTGGGTGCAGAATTTATTCAGG 
TGGGTGT 
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FIGURE 62 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA62815
<subunit 1 of 1, 442 aa, 1 stop
<MW: 49932, pI: 4.55, NX(S/T): 5

MSYNGLHQRVFKELKLLTLCSISSQIGPPEVALTTDEKSISVVLTAPEKWKRNPEDLPVSMQ 
QIYSNLKYOTSVLNTKSNRTWSQCVTNHTLVLTTOEPNTLYCV^ 

CARTLKDQSSEFKAKIIFWYVLPISITVFLFSVMGYSIYRYIHVGKEKHPANLILIYGNEFD 
KRFFVPAEKIVINFITLNISDDSKISHQDMSLLGKSSDVSSLNDPQPSGNLRPPQEEEEVKH 
LGYASHLME I PCDSEENTEGTSLTQQESLSRTIPPDKTVIEYEYDVRTTD I CAGPEEQELSL 
QEEVSTQGTLLESQAAIAVLGPQTLQYSYTPQLQDLDPLAQEHTDSEEGPEEEPSTTLVDWD 

PQTGRLCIPSLSSFDQDSEGCEPSEGDGLGEEGLLSRLYEEPAPDRPPGENETYLMQFMEEW 
GLYVQMEN 

Important features : 
Signal peptide: 

amino acids 1-28 

Transmembrane domain: 

amino acids 140-163 

N-glycosylation sites. 

amino acids 71-74, 80-83, 89-92, 204-207, 423-426 
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FIGURE 63 

CGGACGCGTGGGCGGACGCGTGGGCGGACGCGTGGGTCTCTGCGGGGAGACGCCAGCCTGCG 
TCTGCCATGGGGCTCGGGTTGAGGGGCTGGGGACGTCCTCTGCTGACTGTGGCCACCGCCCT 
GATGCTGCCCGTGAAGCCCCCCGCAGGCTCCTGGGGGGCCCAGATCATCGGGGGCCACGAGG 
TGACCCCCCACTCCAGGCCCTACATGGCATCCGTGCGCTTCGGGGGCCAACATCACTGCGGA 
GGCTTCCTGCTGCGAGCCCGCTGGGTGGTCTCGGCCGCCCACTGCTTCAGCCACAGAGACCT 
CCGCACTGGCCTGGTGGTGCTGGGCGCCCACGTCCTGAGTACTGCGGAGCCCACCCAGCAGG 
TGTTTGGCATCGATGCTCTCACCACGCACCCCGACTACCACCCCATGACCCACGCCAACGAC 
ATCTGCCTGCTGCGGCTGAACGGCTCTGCTGTCCTGGGCCCTGCAGTGGGGCTGCTGAGGCT 
GCCAGGGAGAAGGGCCAGGCCCCCCACAGCGGGGACACGGTGCCGGGTGGCTGGCTGGGGCT 
TCGTGTCTGACTTTGAGGAGCTGCCGCCTGGACTGATGGAGGCCAAGGTCCGAGTGCTGGAC 
CCGGACGTCTGCAACAGCTCCTGGAAGGGCCACCTGACACTTACCATGCTCTGCACCCGCAG 
TGGGGACAGCCACAGACGGGGCTTCTGCTCGGCCGACTCCGGAGGGCCCCTGGTGTGCAGGA 
ACCGGGCTCACGGCCTCGTTTCCTTCTCGGGCCTCTGGTGCGGCGACCCCAAGACCCCCGAC 
GTGTACACGCAGGTGTCCGCCTTTGTGGCCTGGATCTGGGACGTGGTTCGGCGGAGCAGTCC 
CCAGCCCGGCCCCCTGCCTGGGACCACCAGGCCCCCAGGAGAAGCCGCCXSaGCCACAACCT 
TGCGGCATGCAAATGAGATGGCCGCTCCAGGCCTGGAATGTTCCGTGGCTGGGCCCCACGGG 
AAGCCTGATGTTCAGGGTTGGGGTGGGACGGGCAGCGGTGGGGCACACCCATTCCACATGCA 
AAGGGCAGAAG CAAACC CAGTAAAATGTTAACTGACAAAAAAAAAAAAAAAAAAAAGAAA 
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FIGURE 64

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA62845
><subunit 1 of 1, 283 aa, 1 stop
><MW: 30350, pI: 9.66, NX(S/T): 2

MGLGLRGWGRPLLTVATALMLPVKPPAGSWGAQIIGGHEVTPHSRPYMASVRFGGQHHCGGF 
LLRARWVVSAAHCFSHRDLRTGLVVLGAEVLSTAEPTQQVFGIDALTTHPDYHPMTHANDIC 
LLRLNGSAVLGPAVGLLRLPGRRARPPTAGTRCRVAGWGFVSDFEELPPGLMEAKVRVLDPD 
VCNSSWKGHLTLTMLCTRSGDSHRRGFCSADSGGPLVCRNRAHGLVSFSGLWCGDPKTPDVY 
TQVSAFVAWIWDWRRSSPQPGPLPGTTRPPGEAA 

Signal peptide: 

amino acids 1-30 
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FIGURE 65 

GAGCTACCCAGGCGGCTGGTGTGCAGCAAGCTCCGCGCCGACTCCGGACGCCTGACGCCTGA 
CGCCTGTCCCCGGCCCGGC^GAGCCGCTACCTGCTGCCGCTGTCGGCGCTGGGCACGGTAG 
CAGGCGCCGCCGTGCTGCTCAAGGACTATGTCACCGGTGGGGCTTGCCCCAGCAAGGCCACC 
ATCCCTGGGAAGACGGTCATCGTGACGGGCGCCAACACAGGCATCGGGAAGCAGACCGCCTT 
GGAACTGGC CAGGAGAGGAGGC AA CATC ATCCTGGC CTGC CGAGACATGG AG AAGTGTGAGG 
CGGCAGCAAAGGACATCCGCGGGGAGACCCTCAATCACCATGTCAACGCCCGGCACCTGGAC 
TTGGCTTCCCTCAAGT CTATCC GAGAGTTTG C AG CAAAGATCATTGAAGAGGAGGAGCGAGT 
GGACATTCTAATCAACAACGCGGGTGTGATGCGGTGCCCCCACTGGACCACCGAGGACGGCT 
TCGAGATGCAGTTTGGCGTT AACC AC CT GGGT CACTTT CT CTTGACAAACTTG CTGCTGGAC 
AAGCTGAAAGCCTC^GCCCCTTCGCGGATCATCAACCTCTCGTCCCTGGCCCATGTTGCTGG 
GCACATAGACTTTGACGACTTGAACTGGCAGACGAGGAAGTATAACACCAAAGCCGCCTACT 
GCCAGAGCAAGCTCGCCATCGTCCTCTTCACCAAGGAGCTGAGCCGGCGGCTGCAAGGCTCT 
GGTGTGACTGTCAACGCCCTGCACCCCGGCGTGGCCAGGACAGAGCTGGGCAGACACACGGG 
C^TCCATGGCTCCACCTTCTCCAGCACCACACTCGGGCCCATCTTCTGGCTGCTGGTCAAGA 
GCCCCGAGCTGGCCGCCCAGCCCAGCACATACCTGGCCGTGGCGGAGGAACTGGCGGATGTT 
TCCGGAAAGTACTTCGATGGACTCAAACAGAAGGCC CCGGCC C C CGAGG CTGAGGATGAGGA 
GGTGGCCCGGAGGCTTTGGGCTGAAAGTGCCCGCCTGGTGGGCTTAGAGGCTCCCTCTGTGA 
GGGAG CAG CC CCTCCC CAGAJ^ACCT CTGGAGCAGATTTG AAAGCCAGGATGGCGCCTC CAG 
AC CGAGGACAGCTGT CCGC CATGC CCGCAGCTTCCT GGCACTAC CTGAGC CGGGAGAC CCAG 
GACTGGCGGCCGCCATGCCCGCAGTAGGTTCTAGGGGGCGGTGCTGGCCGCAGTGGACTGGC 
CTGCAGGTGAGCACTGCCCCGGGCTCTGGCTGGTTCCGTCTGCTCTGCTGCCAGCAGGGGAG 
AGGGGCCATCTGATGCTTCCCCTGGGAATCTAAACTGGGAATGGCCGAGGAGGAAGGGGCTC 
TGTGCACTTGCAGGCCACGTCAGGAG AG C C AGCGGT GC CTGT CGGGGAGGGTTCCAAGGTGC 
TCCGTGAAGAGCATGGGCAAGTTGTCTGACACTTGGTGGATTCTTGGGTCCCTGTGGGACCT 
TGT G CAT G CAT GGT C CT CT CTG AG C CTT GG TTT C TT CAG C AGT G AG ATG CTCAGAAT AACTG 

CTGTCTCCCATGATGGTGTGGTACAGCGAGCTGTTGTCTGGCTATGGCATGGCTGTGCCGGG 
GGTG TTTG CTGAGGGCTT CCTGTG C CAGAGCCCAGC CAGAGAGCAGGTG CAGGTGTCAT CCC 
GAGTTCAGGCTC TG CACGGC ATGGAGTGGGAACCCCAC CAGCTG CTGCTACAGGAC CTGGGA 

TTGCCTGGGACTCCC^CCTTCCTATCAATTCTCATGGTAGTCCAAACTGCAGACTTCTCA 
TTGCTCATTT 
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FIGURE 66

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64842
><subunit 1 of 1, 331 aa, 1 stop
><MW: 35932, pI: 8.45, NX(S/T): 1

MS RYLLPLSALGTVAGAAVLLKDYVTGGACPS KATI PGKTV I VTGANTG I GKQTALELARRG 

GNIILACRDMEKCEAAAKDIRGETLNHHVNARHLDLASLKSIREFAAKIIEEEERVDILII^ 

AGVMRCPHWTTEDGFEMQFGWHLGHFLLTNLLLDKLKASAPSRIINLSSLAHVAGHIDFDD 

LNWQTRKYNTKAAYCQSKLAIVLFTKELSRRLQGSGVTVNALHPGVART^ 

SSTTLGPIFWLLVKSPELAAQP 

ASSARLVGLEAPSVREQPLPR 

Signal peptide: 

amino acids 1-17 
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FIGURE 67 

GAAGTTCGCGAGCGCTGGCATGTGGTCCTGGGGCGCGGCTGGCGGCGCTGCTGGCGGTGCTG 
GCGCTCGGGACAGGAGACCCAGAAAGGGCTGCGGCTCGGGGCGACACGTTCTCGGCGCTGAC 
CAGCGTGGCGCGCGCCCTGGCGCCCGAGCGCCGGCTGCTGGGGCTGCTGAGGCGGTACCTGC 
GCGGGGAGGAGGCG CGGCTGC GGGAC CTGAC T AG ATT CTACGACAAGGTACTTT CTTTG CAT 
GAGGATTCAACAACCCCTGTGGCTAACCCTCTGCTTGCATTTACTCTCATCAAACGCCTGCA 
GTCTGACTGGAGGAATGT GGTACATAGTCTGGAGGC CAGTGAGAACAT C CGAGCT CTGAAGG 

ATGGCTATGAGAAGGTGGAGCAAGACCTTCCAGCCTTTGAGGACCTTGAGGGAGCAGCAAGG 

GCCCTGATGCGG CTGCAGGACGTGTACATGCT CAATGTGAAAGGCCTGGCCCGAGGTGTCTT 

TCAGAGAGTCACTGGCTCTGCCATCACTGACCTGTACAGCCCCAAACGGCTCTTTTCTCTCA 

CAGGGGATGACTGCTTCCAAGTTGGCAAGGTGGCCTATGACATGGGGGATTATTACCATGGC 

ATTCCATGGCTGGAGGAGGCTGTCAGTCTCTTCCGAGGATCTTACGGAGAGTGGAAGACAGA 

GGATGAGGCAAGTCTAGAAGATGCCTTGGATCACTTGGCCTTTGCTTATTTCCGGGCAGGAA 

ATGTTTCGTGTGCCCTCAGCCTCTCTCGGGAGTTTCTTCTCTACAGCCCAGATAATAAGAGG 

ATGG C C AGGAATGTCTTGAAATATGAAAGG CT CTTGGCAGAGAG CCC CAAC CACGTGGTAGC 

TGAGG CTGTCAT CC AGAGGC C CAATATACCCCAC CTGCAGAC CAGAGACACCTACGAGGGGC 

TATGTCAGACCCTGGGTTCCCAGCCCACTCTCTACCAGATCCCTAGCCTCTACTGTTCCTAT 

GAGACCAATTCCAACGCCTACCTGCTGCTCCAGCCCATCCGGAAGGAGGTCATCCACCTGGA 

GCCCTACATTGCTCTCTACCATGACTTCGTCAGTGACTCAGAGGCTCAGAAAATTAGAGAAC 

TTGC AGAACCATGG CTACAGAGGTCAGTGGTGG CAT CAGGGG AG AAG CAGTTACAAGTGGAG 

TACCGCATGAGCAAAAGTGCCTGGCTGAAGGACACTGTTGACCCAAAACT 

CCACCGCATTGCTGCCCTCACAGGCCTTGATGTCCGGCCTCCCTATGCAGAGTATCTGCAGG 

TGGTGAACTATGGCATCGGAGGACACTATGAGCCTCACTTTGACCATGCTACGTCACCAAGC 

AGCCCCCTCTACAGAATGAAGTCAGGAAACCGAGTTGCAACATTTATGATCTATCTGAGCTC 

GGTGGAAG CT GGAGGAGCCACAGC CT TCAT CTATG C CAAC CT CAGCGTGCCTGTGGTTAGGA 

ATGCAGCACTGTTTTGGTGGAACCTGCACAGGAGTGGTGAAGGGGACAGTGACACACTTCAT 
GCTGGCTGTCCTGTCCTGGTGGGAGATAAGTGGGTGGCCAACAAGTGGATACATGAGTATGG 
ACAGGAATTC CG CAGAC C CTG CAG CT C CAG CC CTGAAGACT^ACTGTTGGCAGAGAGAAGC 
TGGTGGAGTCCTGTGGCTTTCCAGAGAAGCCAGGAGCCAAAAGCTGGGGTAGGAGAGGAGAA 
AGCAGAGCAGCCTCCTGGAAGAAGGCCTTGTCAGCTTTGTCTGTGCCTCGCAAATCAGAGGC 
AAGGGAGAGGTTGTTAC CAGGGGA CACTGAGAATGTACATTTGATCTG CCCCAGC CACGGAA 
GTCAGAGTAGGATGCACAGTACAAAGGAGGGGGGAGTGGAGGCCTGAGAGGGAAGTTTCTGG 
AGTTCAGATACTCTCTGTTGGGAACAGGACATCTCAACAGTCTCAGGTTCGATCAGTGGGTC 
TTTT GG CACTTTGAAC CTTGA C CACAGGGAC CAAGAAGTGG C AATGAGGACACCTG CAGGAG 

GGGCTAGCCTGACTCCCAGAACTTTAAGACTTTCTCCCCACTGCCTTCTGCTGCAGCCCAAG 

CAGG GAGTGT CCCCCT CC CAGAAGCATATCC CAGATGAGTGGTACATTAT ATAAGGATTTTT 

TTTAAGTTGAAAACAACTTTCTTTTCTTTTTGTATGATGGTTTT7TAACACAGTCATTAAAA 
ATGTTTATAAAT CAAAA 
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FIGURE 68 

MGPGARLAALLAVLALGTGDPERAAARGDTFSALTSVARALAPERRLLGLLRRYLRGEEARL 
RDLTRFYDKVLSLHEDSTTPVANPLLAFTLIKRLQSDWRNVVHSIjEASENIRALKDGYEKVE 
QDLPAFEDLEGAARALMRLQDVYMLNVKGIARGVFQRVTGSAITDLYSPKRLFSLTGDDCFQ 
VGKVAYDMGDYYHAIPWLEEAVSLFRGSYGEMKTEDEASLEDALDHLAFAYFRAGNVSCALS 
LSREFLLYSPDNKRMARNVLKYERLLAESPNHVVAEAVIQRPNIPHLQTRDTYEGLCQTLGS 
QPTLYQIPSLYCSYETNSNAYLLLQPIRKEVIHLEPYIALYHDFVSDSEAQKIRELAEPWLQ 
RSVVASGEKQLQVEYRISKSAWLKDTVDPKLVTLNHRIAALTGLDVRPPYAEYLQVVNYGIG 
GHYEPHFDHATSPSSPLYRMKSGNRVATFMIYLSSVEAGGATAFIYANLSVPVVRNAALFWW 
NLHRSGEGDSDTLHAGCPVLVGDKWVANKWIHEYGQEFRRPCSSSPED 

Signal peptide: 

amino acids 1-19 
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FIGURE 69 

GAGATAGGGAGTCTGGGTTTAAGTTCCTGCTCCATCTCAGGAGCCCCTGCTCCCACCCCTAG 
GAAGCCACCAGACTCCACGGTGTGGGGCCAATCAGGTGGAATCGGCCCTGGCAGGTGGGGCC 
ACGAGCGCTGGCTGAGGGACCGAGCCGGAGAGCCCCGGAGCCCCCGTAACCCGCGCGGGGAG 
CGCCCAGGATGCCGCGCGGGGACTCGGAGCAGGTGCGCTACTGCGCGCGCTTCTCCTACCTC 
TGGCTCAAGTTTTCACTTATCATCTATTCCACCGTGTTCTGGCTGATTGGGGCCCTGGTCCT 
GTCTGTGGGCAT CTATGCAG AGGTTG AG CGG CAGAAATATAAAAC C CTTGAAAGTGCCTTCC 
TGGCTCCAGCCATCATCCTCATCCTCCTGGGCGTCGTCATGTTCATGGTCTCCTTCATTGGT 
GTGCTGGCGTCCCTCCGTGACAACCTGTACCTTCTCCAAGCATTCATGTACATCCTTGGGAT 
CTGCCTCATCATGGAGCTCATTGGTGGCGTGGTGGCCTTGACCTTCCGGAACCAGACCATTG 
ACTTCCTGAACG ACAACATT CGAAGAGGAATTGAGAACTACTATGATGAT CTGGACTTCAAA 
AACATCATGGACTTTGTTCAGAAAAAGTTCAAGTGCTGTGGCGGGGAGGACTACCGAGATTG 
GAGCAAGAATCAGTACCACGACTGCAGTGCCCCTGGACCCCTGGCCTGTGGGGTGCCCTACA 
CCTGCTGCATCAGGAACACGACAGAAGTTGTCAACACCATGTGTGGCTACAAAACTATCGAC 
AAGGAGCGTTTCAGTGTGCAGGATGTCATCTACGTGCGGGGCTGCACCAACGCCGTGATCAT 
CTGGTTCATGGACAACTACACCATCATGGCGTGCATCCT 

TCCTGGGGGTGCTGCTGACGCTGCTGTACATCACCCGGGTGGAGGACATCATCATGGAGCAC 
TCTGTCACTGATGGGCTCCTGGGGCCCGGTGCCAAGCCCAGCGTGGAGGCGGCAGGCACGGG 
ATG CTGCTTGTGCTAC CC CAAT2&GGG CCCAGC CTGC CATGG CAGCT C CAACAAGGACCGTC 
TGGGATAGCACCTCTCAGTGAACATCGTGGGGCTGGACAGGGCTGCGGCCCCTCTGCCCACA 
CTCAGTACTGACCAAAGCCAGGGCTGTGTGTGCCTGTGTGTAGGTCCCACGGCCTCTGCCTC 
CCCAGGGAGCAGAGCCTGGGCCTCCCCTAAGAGGCTTTCCCCGAGGCAGCTCTGGAATCTGT 
GCCCACCTGGGGCCTGGGGAACAAGGCCCTCCTTTCTCCAGGCCTGGGCTACAGGGGAGGGA 
GAGCCTGAGGCTCTGCTCAGGGCCCATTTCATCTCTGGCAGTGCCTTGGCGGTGGTATTCAA 
GGCAGTTTTGTAGCAC CTGTAATTGGGGAGAGGGAGTG TGC C CCT CGGGG CAGGAGGGAAGG 
GCATCTGGGGAAGGGCAGGAGGGAAGAGCTGTCCATGCAGCCACGCCCATGGCCAGGTTGGC 
CTCTTCTCAGCCTCCCAGGTGCCTTGAGCCCTCTTGCAAGGGCGGCTGCTTCCTTGAGCCTA 
GTTTTTTTTTACGTGATTTT TG TAACATTCATTTTTTTGT ACAG AT AACAGGAGTTTCTGAC 
TAATCAAAGCTGGTATTTCCCCGCATGTCTTATTCTTGCCCTTCCCCCAACCAGTTTGTTAA 
TCAAACAATAAAAACATGTT TTGTTTTGTTTTTAAAAAAAAA 
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FIGURE 70 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64863
><subunit 1 of 1, 294 aa, 1 stop
><MW: 33211, pI: 5.35, NX(S/T): 3

MPRGDSEQVRYCARFS YL WLKF SL 1 1 YSTVFWL I GALVLS VG I YAE VERQKYKTLESAFLAP 
AIILILLGVVMFWSFIGVLASLRDNLYLLQAFMYILGICLIMELIGGWALTFRNQTIDFL 
NDNIRRGlEimDDLDFKNIMDFVQKKFKCCGGEDYRDWSKNQYHDCSAPGPLACGVPYTCC 
IRNTTEWNTMCGYKT IDKERFSVQDVIYVRGCTNAVI IWFMDNYTIMACILLGILLPQFLG 
VLLTLLYITRVED I IMEHSVTDGLLGPGAKPS VEAAGTGCCLCYPN 

Signal peptide: 

amino acids 1-44 

Transmembrane domains: 

amino acids 22-42, 57-85, 93-116, 230-257 
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FIGURE 71 

GAGGAG CGGGC CGAGGAC TC CAGCGTGC C CAGGTCTGG CATC CT G CACTTGCTG CCCT CTGA 

CACCTGGGAAGATGGCCGGCCCGTGGACCTTCACCCTTCTCTGTGGTTTGCTGGCAGCCACC 

TTGATCCAAGCCACCCTCAGTCCCACTGCAGTTCTCATCCTCGGCCCAAAAGTCATCAAAGA 

AAAGCTGACACAGGAGCTGAAGGACCACAACGCCACCAGCATCCTGCAGCAGCTGCCGCTGC 

TCAGTGCCATGCGGGAAAAGCCAGCCGGAGGCAT CC CTGTGCTGGGCAGCCT GGTGAACACC 

GTCCTGAAGCACATCATCTGGCTGAAGGTCATCACAGCTAACATCCTCCAGCTGCAGGTGAA 

GCCCTCGGCCAATGACCAGGAGCTGCTAGTCAAGATCCCCCTGGACATGGTGGCTGGATTCA 

ACACGCC C CTGGTCAAGACCAT CGTGGAGTTCCACATGACGACTGAGGCCCAAG CCACCATC 

CGCATGGACACCAGTGCAAGTGGCCCCACCCGCCTGGTCCTCAGTGACTGTGCCACCAGCCA 

TGGGAGCCTGCGCATCC^CTGCTGTATAAGCTCTCCTTCCTGGTGAACGCCTTAGCTAAGC 

AGGTCATGAACCTCCTAGTGCCATCCCTGCCCAATCTAGTGAAAAACCAGCTGTGTCCCGTG 

AT CGAGGCTT CCTTCAATGGCATGTATGCAGACCTC CTGCAGCTGGTGAAGGTGCC CATTTC 

CCT C AG CATTGAC CGT CTGGAGTTTGAC CT T CTGTAT C CTGC CATCAAGGGTGACACCATTC 

AGCT CT AC CTGGGGGCCAAGTTGT TGGACT CACAGGGAAAGGTG AC CAAG TGGTTC AATAAC 

TCTGC^GCTTCCCTGAC^TGCCCACCCTGGACAACATCCCGTTCAGCCTCATCGTGAGTCA 

GGACGTGGTGAAAGCTGC^GTGGCTGCTGTGCTCTCTCCAGAAGAATTCATGGTCCTGTTGG 

ACTCTGTGCTTCCTGAGAGTGCCCATCGGCTGAAGTCAAGCATCGGGCTGATCAATGAAAAG 

GCTG CAGATAAG CTGGGAT CTACC CAGATC GTGAAGAT C CTAACTCAGGACACTCCCGAGTT 

TT TTATAGAC CAAGGCCATG CCAAGG TGGC C CAACTGATCGTGCTGGAAGTGT TTC CCTCCA 

GTGAAGCCCTCCGCCCTTTGTTCACCCTGGGCATCGAAGCCAGCTCGGAAGCTCAGTTTTAC 

ACCAAAGG TGACCAACTTATACTCAACTTGAATAACATCAGCTCTGAT CGGATCCAGCTGAT 

GAACTCTGGGATTGGCTGGTTCCAACCTGATGTTCTGAAAAACATCATCACTGAGATCATCC 

ACTCCATC CTGCTGCCGAACCAGAATGGCAAATTAAGATCTGGGGT CC CAGTGTCATTGGTG 

AAGGCCTTGGGATTCGAGGCAGCTGAGTCCTCACTGACCAAGGATGCCCTTGTGCTTACTCC 

AGCCTCCTTGTGGAAACCCAGCTCTCCTGTCTCCCAGTGAAGACTTGGATGGCAGCCATCAG 

GGAAGGCTGGGTCCCAGCTGGGAGTATGGGTGTGAGCTCTATAGACCATCCCTCTCTGCAAT 
CAATAAACACTTGCCTGTGAAAAA 
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FIGURE 72 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64881
><subunit 1 of 1, 484 aa, 1 stop
><MW: 52468, pI: 7.14, NX(S/T): 3

MAGPWTFTLLCGLLAATL IQATLS PTAVLI LGPKVI KEKLTQELKDHNATS ILQQLPLLSAM 

REKPAGGIPVI^SLVNTVLKHIIVTLK^ITANILQLQVKPSANDQELLVKIPLDMVAGFNTP^ 

VKTIVEFHMTTEAQATIRMDTSASGPTRLVLSDCATSHGSLRIQLLYKLSFLWAIJVKQVMN 

LLVPSLPNLVKNQLCPVIEASFNGMYADLLQLVKVPISLSIDRLEFDLLYPAIKGDTIQLYL 

GAKLLDSQGKVTKWFNNSAASLTMPTLDNIPFSLIVSQDWKAAVAAVLSPEEFMVLLDSVL 

PESAHRLKSS IGLINEKAADKLGSTQ I VKI LTQDTPEFF IDQGHAKVAQL I VLEVFPS SEAL 

RPLFTLGIEASSEAQFYTKGDQLILNLNNISSDRIQIJ^SGIGWFQPDV^ 

LPNQNGKLRSGVPVSLVKALGFEAAESSLTKDALVLTPASLWKPSSPVSQ 

Important features of the protein: 
Signal peptide: 

amino acids 1-21 

N-glycosylation sites. 

amino acids 48-51, 264-267, 401-404 

Glycosaminoglycan attachment site. 

amino acids 412-415 

LBP / BPI / CETP family proteins. 

amino acids 407-457 



71/X70 



WO 00/12708 



PCT/US99/20111



FIGURE 73 

GAGCGAACATGGCAGCGCGTTGGCGGTTTTGGTGTGTCTCTGTGACCATGGTGGTGGCGCTG 
CTCATCGTTTGCGACGTTCCCTCAGCCTCTGCCCAAAGAAAGAAGGAGATGGTGTTATCTGA 
AAAGGT T AGT C AGCTGATGGAATGGACT AAC AAAAGAC CTGTAATAAGAATG AATGGAGACA 
AGTTCCGTCGCCTTGTGAAAGCCCCACCGAGAAATTACTCCGTTATCGTCATGTTCACTGCT 
. CTCCAACTGCATAGACAGTGTGTCGTTTGCAAGCAAGCTGATGAAGAATTCCAGATCCTGGC 
AAACTCCTGGCGATACTCCAGTGCATTCACCAACAGGATATTTTTTGCCATGGTGGATTTTG 
ATGAAGGCTCTGATGTATTTCAGATGCTAAACATGAATTCAGCTCCAACTTTCATCAACTTT 
CCTG CAAAAGGG AAAC CCAAAC GGGG TG AT AC AT ATGAGTTACAGGTGCGGGGTTTTTCAGC 
TGAGCAGATTGCCCGGTGGATCGCCGACAGAACTGATGTCAATATTAGAGTGATTAGACCCC 
CAAATTATGCTGGTCCCCTTATGTTGGGATTGCTTTTGGCTGTTATTGGTGGACTTGTGTAT 
CTTCGAAGAAGTAATATGGAATTTCTCTTTAATAAAACTGGATGGGCTTTTGCAGCTTTGTG 
TTTTGT GCTT GCTATG AC AT CTGGT CAAATGTGGAACCATATAAGAGGACCACCATATGCCC 
ATAAGAATC C CCACACGGGACATGTGAATTATATCCATGGAAGCAGTCAAGCCCAGTTTGTA 
GCTGAAACACACATTGTTCTTCTGTTTAATGGTGGAGTTACCTTAGGAATGGTGCTTTTATG 
TGAAGC TG CT AC CT CTGACATGGATATTGGAAAGCGAAAGATAATGTGTGTGGCT GG TATTG 
GACTTGTTGTATTATTCTTCAGTTGGATGCTCTCTATTTTTAGATCTAAATATCATGGCTAC 
CCAT ACAG CT TT CTGATG AGTTA^AAAGGT CCCAGAGATATATAGACACTGGAGTACTGGAA 
ATTGAAAAAC GAAAATCGTGTGTGTTTG AAAAGAAGAAT G CAAC TTGTATATTTTGTATTAC 
CT CTTTTTTT CAAGTGATTTAAATAGTTAATCATTTAACCAAAGAAGATGTGTAGTGCCTTA 
ACAAGCAATCCTCTGTC^AAATCTGAGGTATTTGAAAATAATTATCCTCTTAACCTTCTCTT 
C C CAGTGAACTT T ATG G AA CATTTAATTT AG T ACAATT AAGT AT ATT AT AAAAATT G T AAAA 
CTACT ACTTTGTTTTAGTTAGAAC AAAG CT CAAAACTACTTTAGTTAACT TGGTCATCTGAT 
TTTATATTGCCTTATCCAAAGATGGGGAAAGTAAGTCCTGAC CAGGTGTT CCCACATATGCC 
TGTTACAGATAACT ACATTAGG AATT CATT CTTAGCTTCTT CAT CTTTGTGTGGATGTGTAT 
ACTTTACGCATCTTTCCTTTTGAGTAGAGAAATTATGT GTGT CATGTG GTCTTCTGAAAATG 
GAACACGATTCTTCAGAGCACACGTCTAGCCCTCAGCAAGACAGTTGTTTCT 
GCATATTT CC TACTGCG C T CCAGC CTGAGTGATAGAGTGAGACTCTGTCT CAAAAAAAAGTA 
TCTCTAAATACAGGATTATAATTTCTGCTTGAGTATGGTGTTAACTACCTTGTATTTAGAAA 
G ATT TCAG AT T CATTCCAT C TC CTTAGTTTTC TTTTAAGGTGAC CCATCTGTGATAAAAATA 
TAGCTTAGTGCTAAAATCAGTGTAACTTATACATGGCCTAAAATGTTTCTACAAATTAGAGT 
TTGT CACTTATT C CATTTGT AC CTAAGAGAAAAATAGGCTCAGTTAGAAAAGGACT CCCTGG 
CC^GGCGCAGTGACTTACGCCTGTAATCTCAGCACTTTGGGAGGCCAAGGCAGGCAGATCAC 
GAGGTCAGGAGTTCGAGACCATCCTGGCCAACATGGTGAAACCCCGTCTCTACTAAAAATAT 
AAAAATTAGCTGGGTGTGGTGGCAGGAGCCTGTAATCCCAGCTACACAGGAGGCTGAGGCAC 
GAGAAT C ACT TGAACT CAG GAGATGGAGGTTT CAGTGAGC CGAG AT CACG CCACTG CACTC C 
AGCCTGG CAACAGAGCGAGACTCCAT CTCAAAAAAAAAAAAAA 
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FIGURE 74 

• MAARWRFWCTSVTMWALLIVCDVP 
RkVTtAPPRNYSVIVMFTALQLHRQCWCKQADEEFQ 

SDVFQMLNMNSAPTFINFPAKGKPKRGDTYELQVRGFSAEQIARWIADRTDVNIRVIRPPNY 
AGPL^GLLLAV IGGLVYLRRSNME FLFNKTGWAFAALCFVLAOT GQMWNH IRGP PYAHKN 

PHTGHVNYIHGSSQAQFVAETHIVLLFNGGVTLGMVLLCEAATSDMDIGKRKIMCVAGIGLV 
VLFFSWMLS IFRSKYHGYPYSFLMS 

Signal peptide: 

amino acids 1-29 

Transmembrane domains : 

amino acids 183-205, 217-237, 217-287, 301-321 
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FIGURE 75 

AAGCAACCAAACTGCAAGCTTTGGGAGTTGTTCGCTGTCCCTGCCCTGCTCTGCTAGGGAGA 
GAACGCCAGAGGGAGGCGGCTGGCCCGGCGGCAGGCTCTCAGAACCGCTACCGGCGATGCTA 
CTGCTGTGGGTGTCGGTGGTCGCAGCCTTGGCGCTGGCGGTACTGGCCCCCGGAGCAGGGGA 
GCAGAGGCGGAGAGCAGCCAAAGCGC C C AATG TGGT GCTGGT CGTG AG CGACT C CT TCGATG 
GAAGGTTAACATTTCATCCAGG AAGT CAGGTAGTGAAACTTC CTTTT AT CAAC TTT ATGAAG 
ACACGTGGGACTTCCTTTCTGAATGCCTACACAAACTCTCCAATTTGTTGCCCATCACGCGC 
AG CAATGTGGAGTGG CCT CTTCACTC ACTTAACAGAAT CT TGGAATAATTTTAAGGGTCTAG 
AT C CAAATTATA CAACATGG AT GGAT GT CATGGAGAGG CATGG C TA CCGAACACAGAAATTT 
GGGAAACTGGACTATACTTCAGGACATCACTCCATTAGTAATCGTGTGGAAGCGTGGACAAG 
AG ATGTTG CTTT CTTACT CAGACAAGAAGG CAGGCC CATGGTTAAT CTTATCCGTAACAGGA 
CTAAAGTCAGAGTGATGGAAAGGGATTGGCAGAATACAGACAAAGCAGTAAACTGGTTAAGA 
AAGGAAGCAATTAATTACACTGAACCATTTGTTATTTACTTGGGATTAAATTTACCACACCC 
TTACCCTTCACCATCTTCTGGAGAAAATTTTGGATCTTCAACATTTCACACATCTCTTTATT 
GG CTTGAAAAAG TGT CT CATGATGCCAT CAAAATC CCAAAGTGGT CAC CTTTGTCAGAAATG 
CA C C CTGTAGAT TATT AC TCTT CTTATACAAAAAACTGCACTGGAAGATTTACAAAAAAAGA 
AATTAAGAATATTAGAGCATTTTATTATGCTATGTGTGCTGAGACAGATGCCATGCTTGGTG 
AAATTATTTTGG C CC TT CATCAATTAGATCTT CTT C AGAAAA CTATTGT C ATATAC T C CT CA 
GACC ATGG AGAGCTGGC CATGGAACAT CGACAGTTTTATAAAATGAGCATGTACGAGGCTAG 
TG CACATG TTCCGCTTTTG ATGATGGGACCAGGAATTAAAGC CGG C CT ACAAGTAT CAAATG 
TGGTTTCTCTTGTGGATATTTACCCTACCATGCTTGATATTGCTGGAATTCCTCTGCCTCAG 
AACCTGAGTGGATACTCT TTGTTG CCG TTATCAT CAGAAACATTTAAGAATGAACATAAAGT 
CAAAAACCTGCATCCACCCTGGATTCTGAGTGAATTCCATGGATGTAATGTGAATGCCTCCA 
CCTACATGCTTCGAACTAAC CACT GGAAAT ATAT AG C CTATTCGGATGGTGCATCAATATTG 
CCTCAACTCTTTGATCTTTCCTCGGATCCAGATGAATTAACAAATGTTGCTGTAAAATCT 
AG AAATTACTTATT CTTTGG AT CAGAAG CTT CATT C CATT ATAAA CT ACCCT AAAG TTTCTG 
CTTC TGTC CACCAGTATAATAAAG AGCAGT TT AT CAAGTGGAAACAAAGTATAGGACAGAAT 
TATTCAAACGTT AT AGCAAATCTT AG GT GG CACCAAGACTGGCAGAAGGAACCAAGGAAGTA 
TG AAAATG CAA T TG AT CAGT GG CTTAAAAC C C AT AT G AAT C CAAGAG CAGTT TGAA CAAAAA 
GTTTAAAAATAGTGTTCTAGAGATACATATAAATATATTACAAGATCATAATTATGTATTTT 
AAATGAAACAGTTTTAATAATTACCAAGTTTTGGCCGGGCACAGTGGCTCACACCTGTAATC 
CCAGGACTTTGGGAGGCTGAGGAAAGCAGATCACAAGGTCAAGAGATTGAGACCATCCTGGC 
CAACATGGTGAAACCCTGTCTCTACTAAAAATACAAAAATTAGCTGGGCGCGGTGGTGCACA 
CCT ATAGTCT CAGCTACT CAGAGGCTGAGGCAGG AGGATCGCTTGAACC C GGGAGGCAGCAG 
TTGCAGTGAGCTGAGATTGCGCCACTGTACTCCAGCCTGGCAACAGAGTGAGACTGTGTCGC 
AAAAAAAT AAAAATAAAATAAT AAT AATT AC CAA TTTT T CAT T ATTTT GT AAGAATGTAG TG 
TATTTT AAGATAAAATGCCAATGATTATAAAATCACATATTTT CAAAAAT GGTT ATT ATTTA 
GGC CTTTGTACAATTTCTAACAATTT AGTGGAAG T ATCAAAAGGATTGAAGCAAATACTG TA 
ACAGTTATGTTCCTTTAAATAATAGAGAATATAAAATATTGTAATAATATGTATCATAAAAT 
AGTTGTATGTGAGCATTTGATGGTGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 76 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64885
<subunit 1 of 1, 536 aa, 1 stop
<MW: 61450, pI: 9.17, NX(S/T): 7
MLLLWSWAALALAVIAPGAGEQRRRAAKAPNVVLW 

MKTRGTS F LNAYTNS P I C C P S RAAMWSG LFTH LTE S WNNF KGLD PNYTTWMD VME RHG YRTQ 
KFGKLDYTSGHHSISNRVEAWTRDVAF 

LRKEAINYTEPFVI YLGLNLPHPY PS PS SGENFGSSTFHTSLYWLEKVSHDAI KI PKWSPLS 
EMHPVDYYSSYTKNCTGRFTKKEIKNIRAFYYAMCAETDAMLGEIILALHQLDLLQKTIVIY 
SS DHGELAMEHRQF YKMSWEASAHVPLLMMGPGIKAGLQVSNWSLVDI YPTMLD I AG I PL 
PQNLSGYSLLPLSSETFKNEHKVKtnjHPPWILSEFHGCNVNASTYMLRTNlIWKYJAYSDG^ 
ILPQLFDLSSDPDELTNVAVKFPEITYSLDQKLHSIINYPKVSASVHQYNKEQFIKWKQSIG 
QNYSNVIANLRWHQDWQKEPRKYENAIEQWLKTHMNPRAV 

Important features: 
Signal peptide: 

amino acids 1-15 

N-glycosylation sites:

amino acids 108-111, 166-169, 193-196, 262-265, 375-378, 413-416, 
498-501 

Sulfatases proteins: 

amino acids 286-315, 359-369, 78-97 
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FIGURE 77 

G AGAG AAGTCAGCCTGGCAGAGAGACT CTG AAATGAGGGATT AGAGGTGTTC AAGG AG CAAG 
AGCTTCAGCCTGAAGACAAGGGAGCAGTCCCTGAAGACGCTTCTACTGAGAGGTCTGCC&TG 
GCCTCTCTTGGCCTCCAACTTGTGGGCTACATCCTAGGCCTTCTGGGGCTTTTGGGCACACT 
GGTTGC^TGCTGCTCCCCAGCTGGAAAACAAGTTCTTATGTCGGTGCCAGCATTGTGACAG 
CAGTTGGCTTCTCCAAGGGCCTCTGGATGGAATGTGCCACACACAGCACAGGCATCACCCAG 
TGTGACATCTATAG CACC CTT CTGGG CCTG CCCG CTGACAT C CAGG CTG CCCAGGCCATGAT 

GGTGACATCCAGTGCAATCTCCTCCCTGGCCTGCATTATCTCTGTGGTGGGCATGAGATGCA 
CAGTCTTCTGCCAGGAATCCCGAGCCAAAGACAGAGTGGCGGTAGCAGGTGGAGTCTTTTTC 
ATCCTTGGAGGCCTCCTGGGATTCATTCCTGTTGCCTGGAATCTTCATGGGATCCTACGGGA 
CTTCTACTCACCACTGGTGCCTGACAGCATGAAATTTGAGATTGGAGAGGCTCTTTACTTGG 
GCATTATTTCTTCCCTGTTCTCCCTGATAGCTGGAATCATCCTCTGCTTTTCCTGCTCATCC 
CAGAGAAATCGCTCCAACTACTACGATGCCTACCAAGCCCAACCTCTTGCCACAAGGAGCTC 
TCCAAGGCCTGGTCAACCTCCCAAAGTCAAGAGTGAGTTCAATTCCTACAGCCTGACAGGGT 
ATGTGTGAAGAACCAGGGGCCAGAGCTGGGGGGTGG CTGGGT CTGTGAAAAACAGTGGACAG 
CACCCCGAGGGCCACAGGTGAGGGACACTACCACTGGATCGTGTCAGAAGGTGCTGCTGAGG 
ATAGACTGACT TTGGC CATTGGATTGAGCAAAGG CAGAAATGGGGG CTAGTGTAACAG CATG 

CAGGTTGAATTGCCAAGGATGCTCGCCATGCCAGCCTTTCTGTTTTCCTCACCTTGCTGCTC 
CCCTG CCCTAAG TC CCCAAC CCTCAACTTG AAACC CCATT CC CTTAAGCCAGGACT CAGAGG 
ATCCCTTTGCCCTCTGGTTTACCTGGGACTCCATCCCCAAACCCACTAATCACATCCCACTG 
ACTGACCCTCTGTGATCAAAGACCCTCTCTCTGGCTGAGGTTGKSCTCTTAGCTCATTGCTGG 
GGATGGGAAGGAGAAGCAGTGGCTTTTGTGGGCATTGCTCTAACCTACTTCTCAAGCTTCCC 
TCCAAAGAAACTGATTGGCCCTGGAACCTCCATCCCACTCTTGTTATGACTCCACAGTGTCC 
AGACTAATTTGTGCATGAACTGAAATAAAACCATCCTACGGTATCCAGGGAACAGAAAGCAG 
GATG CAGG ATGGGAG G AC AGG AAGGCAG C CTGGGAC ATTT AAAAAAATA 
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FIGURE 78 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64886
><subunit 1 of 1, 230 aa, 1 stop
><MW: 24549, pI: 8.56, NX(S/T): 1

MASI^LQLVGYILGLLGLU3TLVAm,LPSWKTSSYVGASIVTAVGFSKGLW1^0VTHSTGIT 
QCDI YSTLLGLP AD IQ AAQAMMVTSSAI SSLACI I S WGMRCTVFCQESRAKDRVAVAGGVF 
FILGGLLGFIPVAWNLHGILRDFYSPLVPDSMKFEIGEALYLGIISSLFSLIAGIILCFSCS 
SQRNRSNYYDAYQAQPLATRSSPRPGQPPKVKSEFNSYSLTGYV 

Important features of the protein: 
Signal peptide: 

amino acids 1-24 

Transmembrane domains: 

amino acids 82-102, 117-140, 163-182 

N-glycosylation site. 

amino acids 190-193 

PMP-22 / EMP / MP20 family proteins.

amino acids 46-59 
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FIGURE 79 

GCACTGCTGCTGTCCCATCAGCTGCTCTGAAGCTCCATGGTGCCCAGAATCTTCGCTCCTGC 
TTATGTGTCAGTCTGTCTCCTCCTCTTGTGTCCAAGGGAAGTCATCGCTCCCGCTGGCTCAG 
AAC CATGGCTGTG CCAGC CGGCAC C CAGG TGTGG AGACAAGATCTACAAC CCCTTGGAG CAG 

TGCTGTTACAATGACGCCATCGTGTCCCTGAGCGAGACCCGCCAATGTGGTCCCCCCTGCAC 
CTTCTGGCCCTGCTTTGAGCTCTGCTGTCTTGATTCCTTTGGCCTCACAAACGATTTTGTTG 
TGAAGCTGAAGGTTCAGGGTGTGAATTCCCAGTGCCACTCATCTCCCATCTCCAGTAAATGT 
GAAAGCAGAAGACGTTTTCCCTGAGAAGACATAGAAAGAAAATCAACTTTCACTAAGGCATC 
TCAGAAACATAGGCTAAGGTAATATGTGTACCAGTAGAGAAGCCTGAGGAATTTACAAAATG 
ATGCAGCTCCAAGCCATTGTATGGCCCATGTGGGAGACTGATGGGACATGGAGAATGACAGT 
AGATTATCAGGAAATAAATAAAGTGGTTTTTCCAATGTACACACCTGTAAAA 
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FIGURE 80

MVPRIFAPAyvSVCLLLLCPREVIAPAGSEPWLCQPAPRCGDKIYNPLEQCCYNDAIVSLSE 
TRQCGPPCTFWPCFELCCLDSFGLTNDFWKLKVQGVNSQCHSSPISSKCESRRRFP 

Signal peptide: 
amino acids 1-25 
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FIGURE 81 

CTCCACTGC^CCACCmGAGCCATQGCTCCCCGAGGCTGCATCGTAGCTGTCTTTGCCATT 

TTCTGCATCTCCAGGCTCCTCTGCTCACACGGAGCCCCAGTGGCCCCCATGACTCCTTACCT 

GATGCTGTGCCAGCCACACAAGAGATGTGGGGACAAGTTCTACGACCCCCTGCAGCACTGTT 

GCTATGATGATGCCGTCGTGCCCTTGGCCAGGACCCAGACGTGTGGAAACTGCACCTTCAGA 

GTCTGCTTTGAGCAGTGCTGCCCCTGGACCTTCATGGTGAAGCTGATAAACCAGAACTGCGA 

CTCAGCCCGGACCTCGGATGACAGGCTTTGTCGCAGTGTCAGCTAATGGAACATCAGGGGAA 

CGATGACTCCTGGATTCTCCTTCCTGGGTGGGCCTGGAGAAAGAGGCTGGTGTTACCTGAGA 

TCTGGGATGCTGAGTGGCTGTTTGGGGGCCAGAGAAACACACACTCAACTGCCCACTTCATT 

CTGTGACCTGTCTGAGGCCCACCCTGCAGCTGCCCTGAGGAGGCCCACAGGTCCCCTTCTAG 

AATTCTGGACAGCATGAGATGCGTGTGCTGATGGGGGCCCAGGGACTCTGAACCCTCCTGAT 

GACCCCTATGGCCAACATCAACCCGGCACCACCCCAAGGCTGGCTGGGGAACCCTTCACCCT 

TCTGTGAGATTTTCCATCATCTCAAGTTCTCTTCTATCCAGGAGCAAAGCACAGGATCATAA 
TAAATTTATGTACTTTATAAATGAAAA 



SI /* 70 
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FIGURE 82 

MAPRGCIVAVFAIFCISRLLCSHGAPVAPMTPYLMLCQPHKRCGDKFYDPLQHCCYDDAWP 
LARTQTCGNCTFRVCFEQCCPWTFIWKLINQNCDSARTSDDRLCRSVS 

Signal peptide: 

amino acids 1-24 
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FIGURE 83

GGGGGCGGGTGCCTGGAGCACGGCGCTGGGGCCGCCCGCAGCGCTCACTCGCTCGCACTCAG 
T CGCGGGAGGCTTCCCCGCG C CGG CCG CGT C CCG C C CG CT C C C CGG CACCAG AAGT TCCTCT 

GCGCGTCCGACGGCGAC^TGGGCGTCCCCACGGCCCTGGAGGCCGGCAGCTGGCGCTGGGGA 
TCCCTGCTCTTCGCTCTCTTCCTGGCTGCGTCCCTAGGTCCGGTGGCAGCCTTCAAGGTCGC 
CACGCCGTATTCCCTGTATGTCTGTCCCGAGGGGCAGAACGTCACCCTCACCTGCAGGCTCT 
TGGGCCCTGTGGACAAAGGGCACGATGTGACCTTCTACAAGACGTGGTACCGCAGCTCGAGG 
GGCGAGGTGCAGACCTGCTCAGAGCGCCGGCCCATCCGCAACCTCACGTTCCAGGACCTTCA 
CCTGCACCATGGAGGCCACCAGGCTGCCAACACCAGCCACGACCTGGCTCAGCGCCACGGGC 
TGGAGTCGGCCTCCGACCACCATGGCAACTTCTCCATCACCATGCGCAACCTGACCCTGCTG 
GATAGCGGCCTCTACTGCTGCCTGGTGGTGGAGATCAGGCACCACCACTCGGAGCACAGGGT 
C CATGGTG CCATGGAGC TGCAGGTGC AG AC AGG C AAAGATG CAC CATCCAACTGTGTGGTGT 
ACCCATCCTCCTCCCAGGATAGTGAAAACATCACGGCTGCAGCCCTGGCTACGGGTGCCTGC 
ATCGTAGGAATCCTCTGCCTCCCCCTCATCCTGCTCCTGGTCTACAAGCAAAGGCAGGCAGC 
CTCCAACCGCCGTGCCCAGGAGCTGGTGCGGATGGACAGCAACATTCAAGGGATTGAAAACC 
CCGGCTTTGAAGCCTCACCACCTGCCCAGGGGATACCCGAGGCCAAAGTCAGGCACCCCCTG 
TCCTATGTGGCCCAGCGGCAGCCTTCTGAGTCTGGGCGGCATCTGCTTTCGGAGCCCAGCAC 
CCCCCTGTCTCCTCCAGGCCCCGGAGACGTCTTCTTCCCATCCCTGGACCCTGTCCCTGACT 
CTCCAAACTTTGAGGTCATCTMCCCAGCTGGGGGACAGTGGGCTGTTGTGGCTGGGTCTGG 
GGCAGGTGCATTTGAGCCAGGGCTGGCTCTGTGAGTGGCCTCCTTGGCCTCGGCCCTGGTTC 
CCTCCCTCCTGCTCTGGGCTCAGATACTGTGACATCCCAGAAGCCCAGCCCCTCAACCCCTC 
TGGATGCTACATGGGGATGCTGGACGGCTCAGCCCCTGTTCCAAGGATTTTGGGGTGCTGAG 
ATTCT CCCCTAG AGACCTG AAATT CACCAG CTACAGATG C CAAATG ACTT ACATCTTAAGAA 
GTCTCAGAACGT CCAGC C CTTC AG CAGCT C TCGTT CTG AG ACATGAGCCTTGGGATGTGGCA 
GCATCAGTGGGACAAGAT GGAC ACTGGG CC AC CCTC CCAGG CAC CAGACACAGGGCACGGTG 
GAGAGACTTCTCCCCCGTGGCCGCCTTGGCTCCCCCGTTTTGCCCGAGGCTGCTCTTCTGTC 
AGACTTCCTCTTTGTACCACAGTGGCTCTGGGGCCAGGCCTGCCTGCCCACTGGCCATCGCC 
ACCTTCCCCAGCTGCCTCCTACCAGCAGTTTCTCTGAAGATCTGTCAACAGGTTAAGTCAAT 
CTGGGGCTTCCACTGCCTGCATTCCAGTCCCCAGAGCTTGGTGGTCCCGAAACGGGAAGTAC 
ATATTGGGGCATGGTGGCCTCCGTGAGCAAATGGTGTCTTGGGCAATCTGAGGCCAGGACAG 
ATGTTGCCCCACCCACTGGAGATGGTGCTGAGGGAGGTGGGTGGGGCCTTCTGGGAAGGTGA 
GTGGAGAGGGGCACCTGCCCCCCGCCCTCCCCATCCCCTACTCCCACTGCTCAGCGCGGGCC 
ATTGCAAGGGTGCCACACAATGTCTTGTCCACCCTGGGACACTTCTGAGTATGAAGCGGGAT 
GCTATTAAAAACTACATGGGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAGA 



23/X10 
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FIGURE 84 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64897
><subunit 1 of 1, 311 aa, 1 stop
><MW: 33908, pI: 6.87, NX(S/T): 6

MGVPTAIiEAGSWRWGSIiFALFLAASLGPVAAFKVATPYSLYVCP3GQNVTLTCRLLGPVDK 
GHDVTFYKTWYRSSRGEVQTCSERRPIRNLTFQDLHLHHGGHQAANTSHDLAQRHGLESASD 
HHGNFSITMRNLTLLDSGLYCCLWEIRHHHSEHRVHGAMELQVQTGKDAPSNCWYPSSSQ 
DSENITAAALATGACIVGILCLPLILLLVYKQRQAASNRRAQELVRMDSNIQGIENPGFEAS 
PPAOGIPE^UCVRHPLSYVAQRQPSESGRHLLSEPSTPLSPPGPGDVFFPSLDPVPDSPNFEVI 

Signal peptide: 

amino acids 1-28 

Transmembrane domain: 

amino acids 190-216 
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FIGURE 85 

CCCACGCGTCCGCGCCTCTCCCTTCTGCTGGACCTTCCTTCGTCTCTCCATCTCTCCCTCCT 

TTCCCCGCGTTCTCTTTCCACCTTTCTCTTCTTCCCACCTTAGACCTCCCTTCCTGCCCTCC 

TTTCCTGCCCACCGCTGCTTCCTGGCCCTTCTCCGACCCCGCTCTAGCAGCAGACCTCCTGG 

GGTCTGTGGGTTGATCTGTGGCCCCTGTGCCTCCGTGTCCTTTTCGTCTCCCTTCCTCCCGA 

CTCCGCTCCCGGACCAGCGGCCTGACCCTGGGGAAAGGAIGGTTCCCGAGGTGAGGGTCCTC 

TCCTCCTTGCTGGGACTCGCGCTGCTCTGGTTCCCCCTGGACTCCCACGCTCGAGCCCGCCC 

AGACATGTTCTGCCTTTTCCATGGGAAGAGATACTCCCCCGGCGAGAGCTGGCACCCCTACT 

TGGAGCCACAAGGCCTGATGTACTGCCTGCGCTGTACCTGCTCAGAGGGCGCCCATGTGAGT 

TGTTACCGCCTCCACTGTCCGCCTGTCCACTGCCCCCAGCCTGTGACGGAGCCACAGCAATG 

CTGTCCCAAGTGTGTGGAACCTCACACTCCCTCTGGACTCCGGGCCCCACCAAAGTCCTGCC 

AGCACAACGGGACCATGTACCAACACGGAGAGATCTTCAC?rGCCCATGAGCTGTTCCCCTCC 

CGCCTGCCCAACCAGTGTGTCCTCTGCAGCTGCACAGAGGGCCAGATCTACTGCGGCCTCAC 

AACCTGCCCCGAACCAGGCTGCCCAGCACCCCTCCCACTGCCAGACTCCTGCTGCCAAGCCT 

GCAAAGATGAGGCAAGTGAGCAATCGGATGAAGAGGACAGTGTGCAGTCGCTCCATGGGGTG 

AGACATCCTCAGGATCCATGTTCCAGTGATGCTGGGAGAAAGAGAGGCCCGGGCACCCCAGC 

CCCCACTGGCCTCAGCGCCCCTCTGAGCTTCATCCCTCGCCACTTCAGACCCAAGGGAGCAG 

GCAGCACAACTGTCAAGATCGTCCTGAAGGAGAAACATAAGAAAGCCTGTGTGCATGGCGGG 

AAGACGTACTCCCACGGGGAGGTGTGGCACCCGGCCTTCCGTGCCTTCGGCCCCTTGCCCTG 

CATCCTATGCACCTGTGAGGATGGCCGCCAGGACTGCCAGCGTGTGACCTGTCCCACCGAGT 

ACCCCTGCCGTCACCCCGAGAAAGTGGCTGGGAAGTGCTGCAAGATTTGCCCAGAGGACAAA 

GC^GACCCTGGCCacaGTGAGATCAGTTCTACC^GGTGTCCCAAGGCACCGGGCCGGGTCCT 

CGTCCACACATCGGTATCCCCAAGCCCAGACAACCTGCGTCGCTTTGCCCTGGAACACGAGG 

CCTCGGACTTGGTGGAGATCTACCTCTGGAAGCTGGTAAAAGATGAGGAAACTGAGGCTCAG 

AGAGGTGAAGTACCTGGCCCAAGGCCACACAGCCAGAATCTTCCACTTGACTCAGATCAAGA 

AAGTCAGGAAGCAAGACTTCCAGAAAGAGGCACAGCACTTCCGACTGCTCGCTGGCCCCCAC 

GAAGGTCACTGGAACGTCTTCCTAGCCCAGACCCTGGAGCTGAAGGTCACGGCCAGTCCAGA 

CAAAGTGACCAAGACATAACAAAGACCTAACAGTTGCAGATATGAGCTGTATAATTGTTGTT 

ATTATATATTAATAAATAAGAAGTTGCATTACCCTCAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 86

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64902
><subunit 1 of 1, 451 aa, 1 stop
><MW: 49675, pI: 7.15, NX(S/T): 1

MVPEVRVLSSIiGIALLWFPLDSHARARPDMFCLFHGKRYSPGESWHPYLEPQGLMYCLRCT 

CSEGAHVSCYRLHCPPVHCPQPVTEPQQCCPKCVEPHTPSGLRAPPKSCQHNGTMYQHGEIP 

SAHELFPSRLPNQCVLCSCTEGQIYCGLTTCPEPGCPAPLPLPDSCCQACKDEASEQSDEED 

SVQSLHGVRHPQDPCSSDAGRKRGPGTPAPTGLSAPLSFIPRHFSPKGAGSTTVKIVLKEKH 

KKACVHGGKTYSHGEVWHPAFRAFGPLPCILCTCEDGRQDCQRVTCPTEYPCRHPEKVAGKC 

CKICPEDKADPGHSEISSTRCPKAPGRVLVHTSVSPSPDNLRRFALEHEASDLVEIYLWKLV 

KDEETEAQRGEVPGPRPHSQNLPLDSDQESQEARLPERGTALPTARWPPRRSLERLPSPDPG 
AEGHGQSRQSDQDITXT 

Signal peptide: 

amino acids 1-25 
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PCT/US99/20111



FIGURE 87 

CTAGCCTGCGCCAAGGGGTAGTGAGACCGCGCGGCAACAGCTTGCGGCTGCGGGGAGCTCCC 
GTGGGCGCTCCGCTGGCTGTGCAGGCGGCCATGGATTCCTTGCGGAAAATGCTGATCTCAGT 
CGCAATGCTGGGCGCAGGGGCTGGCGTGGGCTACGCGCTCCTCGTTATCGTGACCCCGGGAG 
AGCGGCGGAAGCAGGAAATGCTAAAGGAGATG CCACTG CAGGAC CCAAGGAGCAGGGAGGAG 
GCGGCCAGGACCCAGCAGCTATTGCTGGCCACTCTGCAGGAGGCAGCGACCACGCAGGAGAA 
CGTGGCCTGGAGGAAGAACTGGATGGTTGGCGGCGAAGGCGGCGCCAGCGGGAGGTCACCGS 
GAGACCGGACTTGCCTCCGTGGGCGCCGGACCTTGGCTTGGGCGCAGGAATCCGAGGCAGCC 
TTT CTCCTTCGTGGG CC CAGCGGAGAGT CCGGAC CGAG AT AC CATG CCAGG ACT CT CCGGGG 

TCCTGTGAGCTGCCGTCGGGTGAGCACGTTTCCCCCAAACCCTGGACTGACTGCTTTAAGGT 
C CG CAAGGCGGG CCAG GG CCGAGA CG CGAGT CGGATGT GGTG AACTG AAAGAACCAATAAAA 

TC^TGTTCCTCCAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA^ 
AAAAAAAAAAA 
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FIGURE 88 

MDSLRKMLISVAMLGAGAGVGYALLVIVTPGERRKQEMLKEMPLQDPRSREEAARTQQLLLA 
TLQEAATTQENVAWRKNWMVGGEGGASGRS P 

Signal peptide: 

amino acids 1-18 



WO 00/12708 
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FIGURE 89

CAGGAGAGAAGGCACCGCCCCCACCCCGCCTCCAAAGCTAACCCTCGGGCTTGAGGGGAAGA 
GG CTGACTGTACGTTCCTTCTACTCTGGCACCACTCTCCAGGCTGCCATGGGGCCCAGCACC 
CCTCTCCTCATCTTGTTCCTTTTGTCATGGTCGGGACCCCTCCAAGGACAGCAGCACCACCT 
TGTGG AGTACATGGAACGCCGACTAGC TGCTT TAGAGG AACGG CTGGC CCAGTG CCAGGACC 
AGAGTAGTCGGCATGC7GCTGAGCTGCGGGACTTCAAGAACAAGATGCTGCCACTGCTGGAG 
GTGGCAGAGAAGGAGCGGGAGGCACTCAGAACTGAGGCCGACACCAIICTCCGGGAGAGTGGA 
TCGTCTGGAGCGGGAGGTAGACTATCTGGAGACCCAGAACCCAGCTCTGCCCTGTGTAGAGT 
TTGATG AGAAGGTGACTG G AGG C C C TGGG ACCAAAGGCAAGGGAAGAAGGAATGAGAAGT AC 
GATATGGTGACAGACTGTGGCTACACAATCTCTCAAGTGAGATCAATGAAGATTCTGAAGCG 
ATTTGGTGGCCCAG CTGGTCTATGGAC CAAGGATCC ACTGGGG CAAA CAGAG AAGAT CTACG 
TGTTAGATGGGA CACAGAATG ACACAG CCTTTGTCTTC CCAAGG CTGCGT GACT TCAC C CTT 
GCCATGGCTGCCCGGAAAGCTTCCCGAGTCCGGGTGCCCTTCCCCTGGGTAGGCACAGGGCA 
GCTGGTATATGGTGG CTTT CTTTATTTTGCT CGG AGG C CTC CTGGAAGAC CTGG TGG AGGTG 
GTGAGATGGAGAACACTTTGCAG C TAAT CAAATT CCACCT GG CAAACCGAACAGTGGTGGAC 
AGCT CAGTATTC CC AG CAGAG GGG CTGAT CC CCCCCTACGGCTTGACAGC AG ACAC CTACAT 
CGAC CTGGTAG CTGAT GAGGAAGGTCTTTGGG CTGT CTATGC CACCCGGGAGGATGACAGGC 
ACTTGTGTCTGGCCAAGTTAGATCCACAGACACTGGACACAGAGCAGCAGTGGGACACACCA 
TGTCCCAGAGAGAATGCTGAGGCTGCCTTTGTCATCTGTGGGACCCTCTATGTCGTCTATAA 
CACCCGTCCTGCCAGTCGGGCCCGCATCC^GTGCTCCTTTGATGCCAGCGGCACCCTGACCC 
CTGAACGGGCAG CACT CC CTT ATTTT CCC CGCAGATATGGT GCCCATGCCAG CC T C CG CTAT 
AACC CCCGAGAACGCCAGCT CTATGCCTGGGATGATGGCTACCAGATTGTCTATAAGCTGGA 
GATGAGGAAGAAAGAGGAGGAGGTTT^GGAGCTAGCCTTGTTTTTTGCATCTTTCTCACTC 
CCATACATTTATATTATATCCCCACTAAATTTCTTGTTCCTCATTCTTCAAATGTGGGCCAG 
TTGTGGCTCAAATCCTCTATATTTTTAGCCAATGGCAATCAAATTCTTTCAGCTCCTTTGTT 
T C AT ACGGAACTCCAGATC CTGAGTAATC CTTTTAGAGCC CG AAGAGTCAAAAC C CTC AATG 
TTCCCTCCTGCTCTCCTGCCCCATGTCAACAAATTTCAGGCTAAGGATGCCCCAGACCCAGG 
G CTCTAACCTTGTATG CGGGCAGG CC CAGGGAG CAGG C AG CAGTGTTCTTCCCCTCAGAGTG 

ACTTGGGGAGGGAGAAATAGGAGGAGACGTCCAGCTCTGTCCTCTCTTCCTCACTCCTCCCT 
TCAGTGTCCTGAGGAAC^GGACTTTCTCCACATTGTTTTGTATTGCAACATTTTGCATTAAA 
AG G AAAAT C C AC AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 90 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64905 
<subunit 1 of 1, 406 aa, 1 stop
<MW: 46038, pI: 6.50, NX(S/T): 2

MGPSTPLLILFLLSWSGPLQGQQHHLVEYMERRLAALEERIAQCQDQSSRHAAELRDFKNKM 
LPLLEVAEKEREALRTEADT I SGRVDRLERE VDYLETQNP ALPCVEFDEKVTGGPGTKGKGR 
RNEKYDMVTDCGYTISQTOSMKILKRFGGPAGLOTKDPLGQTEKIYVLDGTQNDTAFVFPRL 
RDFTLAMAARKASRVRVPFPWGTGQLVTGGFLYFARRPPGRPGGGGEMEISrrLQLIKFHLAN 
RTVVDSSVFPAEGLIPPYGLTADTYIDLVADEEGLWAVYATREDDRHLCLAKLDPQTLDTEQ 
QWDT P C P RENAE AAF V I CGT L YWYNTRP AS RARI QCS FDASGTLT PE RAAL P YF P RR YG AH 
ASLRYNPRERQLYAWDDGYQIVYKLEMRKKEEEV 

Important features: 
Signal peptide: 

amino acids 1-21 

N-glycosylation sites. 

amino acids 177-180, 248-251 



WO 00/12708 PCT/US99/20111



FIGURE 91

GACAGCTGTGTCTCGATGGAGTAGACTCTCAGAACAGCGCAGTTTGCCCTCCGCTCACGCAG 
AGCCTCTCCGTGGCTTCCGCACCTTGAGCATTAGGCCAGTTCTCCTCTTCTCTCTAATCCAT 
CCGTCACCTCTCCTGTCATCCGTTTCCATGCCGTGAGGTCCATTCACAGAACACATCCATGG 

ctctcatgctcagtttggttctgagtctcctc^gctgggatcagggcagtggcaggtSSt 

GGGCCAGACAAGCCTGTCCAGGCCTTGGTGGGGGAGGACGCAGCATTCTCCTGTTTCCTGTC 

TCCTAAGACCAATGCAGAGGCCATGGAAGTGCGGTTCTTCAGGGGCCAGTTCTCTAGCGTGG 

TCCACCTCTACAGGGACGGGAAGGACCAGCCATTTATGCAGATGCCACAGTATCAAGGCAGG 

ACAAAACTGGTGAAGGATTCTATTGCGGAGGGGCGCATCTCTCTGAGGCTGGAAAACATTAC 

TGTGTTGGATGCTGGCCTCTATGGGTGCAGGATTAGTTCCCAGTCTTACTACCAGAAGGCCA 

TCTGGGAGCTACAGGTGTCAGCACTGGGCTCAGTTCCTCTCATTTCCATCACGGGATATGTT 

GATAGAGACATCCAGCTACTCTGTCAGTCCTCGGGCTGGTTCCCCCGGCCCACAGCGAAGTG 

GAAAGGTCCACAAGGACAGGATTTGTCCACAGACTCCAGGACAAACAGAGACATGCATGGCC 

TGTTTGATGTGGAGATCTCTCTGACCGTCCAAGAGAACGCCGGGAGCATATCCTGTTCCATG 

CGGCATGCTCATCTGAGCCGAGAGGTGGAATCCAGGGTACAGATAGGAGATACCrTTTTCGA 

GCCTATATCGTGGCACCTGGCTACCAAAGTACTGGGAATACTCTGCTGTGGCCTATTTTTTG 

GCA^GTTGGACTGAAGATTTTCTTCTCCAAATTCCAGTGGAAAATCCAGGCGGAACTGGAC 

TGGAGAAGAAAGCACGGACAGGCAGAATTGAGAGACGCCCGGAAACACGCAGTGGAGGTGAC 

TCTGGATCCAGAGACGGCTCACCCGAAGCTCTGCGTTTCTGATCTGAAAACTGTAACCCATA 

GAAAAGCTCCCCAGGAGGTGCCTCACTCTGAGAAGAGATTTACAAGGAAGAGTGTGGTGGCT 

TCTCAGAGTTTCCAAGCAGGGAAACATTACTGGGAGGTGGACGGAGGACACAATAAAAGGTG 

GCGCGTGGGAGTGTGCCGGGATGATGTGGACAGGAGGAAGGAGTACGTGACTTTGTCTCCCG 

ATCATGGGTACTGGGTCCTCAGACTGAATGGAGAACATTTGTATTTCACATTAAATCCCCGT 

TTTATCAGCGTCTTCCCCAGGACCCCACCTACAAAAATAGGGGTCTTCCTGGACTATGAGTG 

TGGGACCATCTCCTTCTTCAACATAAATGACCAGTCCCTTATTTATACCCTGACATGTCGGT 

TTGAAGGCTTATTGAGGCCCTACATTGAGTATCCGTCCTATAATGAGCAAAATGGAACTCCC 

ATAGTCATCTGCCCAGTCACCCAGGAATCAGAGAAAGAGGCCTCTTGGCAAAGGGCCTCTGC 

AATCCCAGAGACAAGCAACAGTGAGTCCTCCTCACAGGCAACCACGCCCTTCCTCCCCAGGG 

GTGAAATGTaSGATGAATCACATCCCACATTCTTCTTTAGGGATATTAAGGTCTCTCTCCCA 

GATCCAAAGTCCCGCAGCAGCCGGCCAAGGTGGCTTCCAGATGAAGGGGGACTGGCCTGTCC 

ACATGGGAGTCAGGTGTCATGGCTGCCCTGAGCTGGGAGGGAAGAAGGCTGACATTACATTT 

AGTTTGCTCTCACTCCATCTGGCTAAGTGATCTTGAAATACCACCTCTCAGGTGAAGAACCG 

TCAGGAATTCCCATCTCACAGGCTGTGGTGTAGATTAAGTAGACAAGGAATGTGAATAATGC 

TTAGATCTTATTGATGACAGAGTGTATCCTAATGGTTTGTTCATTATATTACACTTTCAGTA 
AAAAAA 
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FIGURE 92 

MALMLSLVLSLLKLGSGQWQVFGPDKPVQALVGEDAAFSCFLSPKTNAEAMEVRFFRGQFSS 

WHLYRDGKDQPFMQMPQYQGRTKLVKDSIAEGRISLELENITVLDAGLYGCRISSQSYYQK 

AIWELQVSALGSVPLIS ITGYVDRDIQLLCQSSGWFPRPTAKWKGPQGQDLSTDSRTNRDMH 

GLFDVEISLTVQENAGSISCSMRHAHLSREVESRVQIGDTFFEPISWHLATKVLGILCCGLF 

FGIVGLKIFFSKFQWKIQAELDWRRKHGQAELRDARKHAVEVTLDPETAHPKLCVSDLKTVT 

HRKAPQEVPHSEKRFTRKSWASQSFQAGKHYWEVDGGHNKRWRVGVCRDDVDRRKEYVTLS 

PDHGYWVLRLNGEHLYFTLNPRFISVFPRTPPTKIGVFLDYECGTISFFNINDQSLIYTLTC 

RFEGLLRPYIEYPSYNEQNGTPIVICPVTQESEKEASWQRASAIPETSNSESSSQATTPFLP 
RGEM 

Signal peptide: 

amino acids 1-17 

Transmembrane domain: 

amino acids 239-255 
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FIGURE 93 

GCGATGGTGCGCCCGGTGGCGGTGGCGGCGGCGGTTGCGGAGGCTTCCTTGGTCGGATTGCA 
ACGAGGAGAAGATGACTGACCAACCG ACTGGC TGAATGAATG AATGG CGGAG CC GAGCGCGC 
CMGAGGAGCCTGCCGAGCCTGGGCGGCCTCGCCCTGTTGTGCTGCGCCGCCGCCGCCGCCG 
CCGTCGCCTCAGCCGCCTCGGCGGGGAATGTCACCGGTGGCGGCGGGGCCGCGGGGCAGGTG 
GACGCGTCGCCGGGCCCCGGGTTGCGGGGCGAGCCCAGCCACCCCTTCCCTAGGGCGACGGC 
TCCCACGGCCCAGGCCCCGAGGACCGGGCCCCCGCGCGCCACCGTCCACCGACCCCTGGCTG 
CGACTT CT C CAGCCCAGTCC CCGGAG AC CACC C CTCTTTGGG CG ACTG CTGGACCCT CTTCC 

ACCACCTTTCAGGCGCCGCTCGGCCCCTCGCCGACCACCCCTCCGGCGGCGGAACGCACTTC 

GACCACCTCTCAGGCGCCGACCAGACCCGCGCCGACCACCCTTTCGACGACCACTGGCCCGG 

CGCCGACCACCCCTGTAGCGACCACCGTACCGGCGCCCACGACTCCCCGGACCCCGACCCCC 

GATCTCCCCAGCAGCAGCAACAGCAGCGTCCTCCCCACCCCACCTGCCACCGAGGCCCCCTC 

TTCGCCTCCTCCAGAGTATGTATGTAACTGCTCTGTGGTTGGAAGCCTGAATGTGAATCGCT 

GCAACCAGACCACAGGGCAGTGTGAGTGTCGGCCAGGTTATCAGGGGCTTCACTGTGAAACC 

TGCAAAGAGGGCTTTTACCTAAATTACACTTCTGGGCTCTGTCAGCCATGTGACTGTAGTCC 

AC ATGGAG CTCT CAG C AT ACCGTGCAACAGGTAAGCAAC AGAGGGT GGAACTGAAGTTTATT 

TTATTTTAGCAAGGGAAAAAAAAAGGCTGCTACTCTCAAGGACCATACTGGTTTAAACAAAG 

GAGG AT G AGGGT CATAGATTTACAAAATATTTTATATACTTTTATT CT CT TA CTTTATATGT 

TATATTTAATGTCAGGATTTAAAAACATCTAATTTACTGATTTAGTTCTTCAAAAGCACTAG 

AGT CG C CAATTTTTCTCTGGGAT AATTTCTGTAAATTTCATGGG AAAAAATT ATTGAAGAAT 

AAATCTGCTTTCTGGAAGGGCTTTCAGGCATGAAACCTGCTAGGAGGTTTAGAAATGTTCTT 

ATGTTTATTAATATACCATTGGAGTTTGAGGAAATTTGTTGTTTGGTTTATTTTTCTCTCTA 

ATCAAAATTCTACATTTGTTTCTTTGGACATCTAAAGCTTAACCTGGGGGTACCCTAATTTA 

TT TAACTAGTGGTAAGTAGACTGGTTTTACTCTATTTAC CAGTACATTTTTGAGAC CAAAAG 

TAGATTAAGCAGGAATTATCTTTAAACTATTATGTTATTTGGAGGTAATTTAATCTAGTGGA 

ATAATGTACTGTTATCTAAG CAT TTGC CTT GT ACTGCACTGAAAGT AATTATTCTTTGACCT 

TATGTGAGGCACTTGGCTTTTTGTGGACCCCAAGTCAAAAAACTGAAGAGACAGTATTAAAT 

AATGAAAAAAATAATGACAGGTTATACTCAGTGTAACCTGGGTATAACCCAAGATCTGCTGC 

CACTTACGAGCTGTGTTCCTTGGGCAAGTAATTTCCTTTCACrGAGCTTGTTTCTTCTC^ 

GTTGTTGTGAAGATTAAATGAGTTGATATATATAAAATGCCTAGCACATGTCACTCAATAAA 

TT CT GGTT TGTTTTAATTT CAAAGGAAT ATTATGGACTGAAATGAGAGAACATGTTTTAAGA 

ACTTTT AG CT CCTTGACAAAGAAG TGCTTTATACTTTAG CACTAAATATTTTAAATGCTTTA 

TAAATGATATTATACTGTTATGGAATATTGTATCATATTGTAGTTTATTAAAAATGTAGAAG 

AGGCTGGGCGCGGTGGCTCACGCCTGTAATCCTAGCACTTTGGGAGGCCAAGGCGGGTGGAT 

CACTTGAGGCCAGGAGTTCTAGATGAGCCTGGCCAGCACAGTGAAACCCCGTCTCTACTAAA 

AAT ACAAACAAATTAGCTGGGCGTGGTGGCAC AC AC CT GTAGTC CC AG CT ACT CGGGAGG CT 

GAGG CAGGAGAATCGGTTGAACCCGGGAGGTGGAGGTTG CAG TGAGCTGAGATCGCGCCACT 

GCACTCCAGCCTGGTGAGAGAGGGAGACTCTGTCTTAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 94 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA64952
><subunit 1 of 1, 258 aa, 1 stop
><MW: 25716, pI: 8.13, NX(S/T): 5

MRSLPSLGGIALLCCAAAAAAVASAASAGNVTGGGGAAGQVDASFGPGLRGEPSHPFPRATA 

PTAQAPRTGPPRATVHRPLAATSPAQSPETTPLWATAGPSSTTFQAPLGPSPTTPPAAERTS 

TTSQAPTRPAPTTLSTTTGPAPTTPVATTVPAPTTPRTPTPDLPSSSNSSVLPTPPATEAPS 

SPPPEYVCNCSWGSLNVNRCNQTTGQCECRPGYQGLHCETCKEGFYLNYTSGLCQPCDCSP 
HGALSIPCNR 

Important features of the protein: 
Signal peptide: 

amino acids 1-25 

N-glycosylation sites. 

amino acids 30-33, 172-175, 195-198, 208-211, 235-238

EGF-like domain cysteine pattern signature. 

amino acids 214-226. 
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FIGURE 95 

TGCGGCGCAGTGTAGACCTGGGAGG^^GCGGCCTGCTGCTGGCTGCTTTTCTGGCTTTGG 
TCTCGGTGCCCAGGGCCCAGGCCGTGTGGTTGGGAAGACTGGACCCTGAGCAGGTTCTTGGG 
CCCTGGTACGTGCTTGCGGTGGCCTCCCGGGAAAAGGGCTTTGCCATGGAGAAGGACATGAA 
GAACGTCGTGGGGGTGGTGGTGACCCTCACTCCAGAAAACAACCTGCGGACGCTGTCCTCTC 
AGCACGGGCTGGGAGGGTGTGACCAGAGTGT CATGGAC CTGATAAAGCGAAACTCCGGATGG 
GTGTTTGAGAATCCCTCAATAGGCGTGCTGGAGCTCTGGGTGCTGGCCACCAACTTCAGAGA 
CTATGCCATCATCTTCACTCAGCTGGAGTTCGGGGACGAGCCCTTCAACACCGTGGAGCTGT 
AC AGT CTGACGGAG AC AG CC AGCCAGGAGG C C ATGG GGCT CTT CACCAAGTGGAGCAGGAGC 
CTGGGCTT C CTGT CACAGTTAGCAGG C C C AGC TG CAGAAGGACCTCAC CTGTG CTCACAAGAT 
CCTTCTGTGAGTGCTGCGTCCCCAGTAGGGATGGCGCCCACAGGGTCCTGTGACCTCGGCCA 

GTGTCCACCCACCTCGCTCAGCGGCTCCCGGGGCCCAGCACCAGCTCAGAATAAAGCGATTC 
CACAGCA 
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FIGURE 96 

MGGLLU^FIALVSVPRAQAVWLGRLDPEQ 

LTPENl^RTLSSQHGLGGCDQSVMDLIKRNSGWVFENPSIGVLELWVLATNFRDYAIIFTQL 
EFGDEPFNTVELYSLTETASQEAMGLFTKWSRSLGFLSQ 

Signal peptide: 

amino acids 1-20 
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FIGURE 97 

AACAGACGTTCCCTCGCGGCCCTCSGCACCTCTAACCCCAGAC^SCTGCTGCTGCTGCTGCC 

CCTGCTCTGGGGGAGGGAGAGGGCGGAAGGACAGACAAGTAAACTGCTGACGATGCAGAGTT 

CCGTGACGGTGCAGGAAGGCCTGTGTGTCCATGTGCCCTGCTCCTTCTCCTACCCCTCGCAT 

GGCTGGATTTACCCTGGCCCAGTAGTTCATGGCTACTGGTTCCGGGAAGGGGCCAATACAGA 

CCAGGATGCTCCAGTGGCCACAAACAACCCAGCTCGGGCAGTGTGGGAGGAGACTCGGGACC 

GATTCCACCTCCTTGGGGACCCACATACCAAGAATTGCACCCTGAGCATCAGAGATGCCAGA 

AGAAGTGATGCGGGGAGATACTTCTTTCGTATGGAGAAAGGAAGTATAAAATGGAATTATAA 

ACATCACCGGCTCTCTGTGAATGTGACAGCCTTGACCCACAGGCCCAACATCCTCATCCCAG 

GCACCCTGGAGTCCGGCTGCCCCCAGAATCTGACCTGCTCTGTGCCCTGGGCCTGTGAGCAG 

GGGACACCCCCTATGATCTCCTGGATAGGGACCTCCGTGTCCCCCCTGGACCCCTCCACCAC 

CCGCTCCTCGGTGCTCACCCTCATCCCACAGCCCCAGGACCATGGCACCAGCCTCACCTGTC 

AGGTGACCTTCCCTGGGGCCAGCGTGACCACGAACAAGACCGTCCATCTCAACGTGTCCTAC 

CCGCCTCAGAACTTGACCATGACTGTCTTCCAAGGAGACGGCACAGTATCCACAGTCTTGGG 

AAATGGCTCATCTCTGTCACTCCCAGAGGGCCAGTCTCTGCGCCTGGTCTGTGCAGTTGATG 

CAGTTGACAGCAATCCCCCTGCCAGGCTGAGCCTGAGCTGGAGAGGCCTGACCCTGTGCCCC 

TCACAGCCCTCAAACCCGGGGGTGCTGGAGCTGCCTTGGGTGCACCTGAGGGATGCAGCTGA 

ATTCACCTGCAGAGCTCAGAACCCTCTCGGCTCTCAGCAGGTCTACCTGAACGTCTCCCTGC 

AGAGCAAAGCCACATCAGGAGTGACTCAGGGGGTGGTCGGGGGAGCTGGAGCCACAGCCCTG 

GTCTTCCTGTCCTTCTGCGTCATCTTCGTTGTAGTGAGGTCCTGCAGGAAGAAATCGGCAAG 

GCCAGCAGCGGGCGTGGGAGATACGGGCATAGAGGATGCflAACGCTGTCAGGGGTTCAGCCT 

CTCAGGGGCCCCTGACTGAACCTTGGGCAGAAGACAGTCCCCCAGACCAGCCTCCCCCAGCT 

TCTGCCCGCTCCTCAGTGGGGGAAGGAGAGCTCCAGTATGCATCCCTCAGCTTCCAGATGGT 

GAAGCCTTGGGACTCGCGGGGACAGGAGGCCACTGACACCGAGTACTCGGAGATCAAGATCC 

ACAGASgAGAAACTGCAGAGACTCACCCTGATTGAGGGATCACAGCCCCTCCAGGCAAGGGA 

GAAGTCAGAGGCTGATTCTTGTAGAATTAACAGCCCTCAACGTGATGAGCTATGATAACACT 

ATGAATTATGTGCAGAGTGAAAAGCACACAGGCTTTAGAGTCAAAGTATCTCAAACCTGAAT 

CCACACTGTGCCCTCCCTTTTATTTTTTTAACTAAAAGACAGACAAATTCCTA 
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FIGURE 98

MLLLIJ.PLLWGRERAEGQTSKLLTMQSSVTVQEGLCVHVPCSFSYPSHGWIYPGPVVHGYWF 
REGANTDQDAPVATNNPARAVWEETRDRFHLLGD PHTKNCTLS I RDARRS DAGRYFFRMEKG 

SIKWNYKHHRLSVNVTALTHRPNILIPGTLESGCPQNLTCSVPWACEQGTPPMISWIGTSVS 
PUDPSTTRSSVLTLIPQPQDHGTSLTCQVTFPGASVTTNKTVHLOTSYPPQNLTMTVFQGDG 
TVSTVLGNGSSLSLPEGQSLRLVCAVDAVDSNPPARLSLSWRGLTLCPSQPSNPGVLELPWV 
HLRDAAEF TCRAQNPLGSQQVYLNVSLQ SKATS GVTQG WGGAGATJ^VFLS FCVI FWVRS 

CRKKSARPAAGVGDTGIEDANAVRGSASQGPLTEPWAEDSPPDQPPPASARSSVGEGELQYA 
SLSFQMVKPWDSRGQEATDTEYSEIKIHR 

Signal peptide: 

amino acids 1-15 

Transmembrane domain: 

amino acids 351-370 
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FIGURE 99 

GACGCCCAGTGACCTGCCGAGGTCGGCAGCACAGAGCTCTGGAGATGAAGACCCTGTTCCTG 
GGTGTCACGCTCGGCCTGGCCGCTGCCCTGTCCTTCACCCTGGAGGAGGAGGATATCACAGG 
GACCTGGTACGTGAAGGCCATGGTGGTCGATAAGGACTTTCCGGAGGACAGGAGGCCCAGGA 
AGGTGTCCC CAGTGAAGGTGACAG CC CTGG G CGGTGGGAAGTTG GAAGCCACGTTCACCTTC 
ATGAGGGAGGAT CGGTGC AT C C AG AAGAAAAT C CTG AT G CGG AAGACGGAGG AG C CTGGCAA 
ATACAGCGCCTATGGGGGCAGGAAGCTCATGTACCTGCAGGAGCTGCCCAGGAGGGACCACT 
ACATCTTTTACTGCAAAGACCAGCACCATGGGGGCCTGCTCCACATGGGAAAGCTTGTGGGT 
AGGAATT CTGAT AC CAAC CGGG AGGC CCTGGAAG AATTTAAGAAATTGGT G CAG CG CAAGGG 
ACTCTCGGAGGAGGACATTTTCACGCCCCTGCAGACGGGAAGCTGCGTTCCCGAACACTAGG 
CAGCCCCCGGGTCTGCACCTCCAGAGCCCACCCTACCACCAGACACAGAGCCCGGACCACCT 
GGACCTACCCTCCAGCCATGACCCTTCCCTGCTCCCACCCACCTGACTCCAAATAAAGTCCT 
TTTGCCCCAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 100 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA65404
<subunit 1 of 1, 170 aa, 1 stop
<MW: 19457, pI: 9.10, NX(S/T): 0
^TLFLGVTLGLAAALSFTLEEEDITGTWYVKAMVVD^ 

EATFTFMREDRCIQKKILMRKTEEPGKYSAYGGRKLMYLQELPRRDHYIFYCKDQHHGGLLH 
MGKLVGRNSDTNREALEEFKKLVQRKGLSEEDIFTPLQTGSCVPEH 

Important features: 
Signal peptide: 

amino acids 1-17 
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FIGURE 101 

GTTC CGCAGATGCAGAGGTTGAGGTGGC TG C GGGACTGGAAG TC ATCGGG CAGAGGT CT C AC 
AGCAGCCAAGGAACCTGGGGCCCGCTCCTCCCCCCTCCAGGCCATOAGGATTCTGCAGTTAA 
TCCTGCTTGCTCTGGCAACAGGGCTTGTAGGGGGAGAGACCAGGATCATCAAGGGGTTCGAG 
TGCAAGCCTCACTCCCAGCCCTGGCAGGCAGCCCTGTTCGAGAAGACGCGGCTACTCTGTGG 
GGCGACGCTCATCGCCCCCAGATGGCTCCTGACAGCAGCCCACTGCCTCAAGCCCCGCTACA 
TAGTTCACCTGG GGCAGCACAAC CTC CAGAAGGAGGAGGGCTGTGAG C AGAC CCGGACAGCC 
ACTGAGTCCTTCCCCCACCCCGGCTTCAACAACAGCCTCCCCAACAAAGACCACCGCAATGA 
CATCATGCTGGTGAAGATGGCATCGCCAGTCTCCATCACCTGGGCTGTGCGACCCCTCACCC 
TCTCCTCACGCTGTGTCACTGCTGGCACCAGCTGCCTCATTTCCGGCTGGGGCAGCACGTCC 
AGCCCCCAGTTACGCCTGCCTCACACCTTGCGATGCGCCAACATCACCATCATTGAGCACCA 
GAAGTG TG AG AACG C C TAC CC CGGCAACAT CACAGACAC CATGGTG TGTGCCAG CG TG CAGG 

AAGGGGGCAAGGACTCCTGCCAGGGTGACTCCGGGGGCCCTCTGGTCTGTAACCAGTCTCTT 
CAAGGCATTATCTCCTGGGGCCAGGATCCGTGTG CGATCACC CGAAAGCCTGGTGTCTACAC 
GAAAGTCTGCAAATATGTGGACTGGATCCAGGAGACGATGAAGAACAATTAGACTGGACCCA 
CCCACCACAGCCCATCACCCTCCATTTCCACTTGGTGTTTGGTTCCTGTTCACTCTGTTAAT 
AAGAAACC CTAAGCCAAGACC CTCT ACGAACATT CTTTGGGC CTC C TGGACTAC AGGAGATG 
CTGTCACTTAATAATCAACCTGGGGTTCGAAATCAGTGAGACCTGGATTCAAATTCTGCCTT 
GAAATATTGTGACTCTGGGAATGACAACACCTGGTTTGTTCTCTGTTGTATCCCCAGCCCCA 
AAGACAG CTCCT GG CCATAT AT CAAGGTTTC AATAAATAT TT GC TAAATGAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 102 

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA65405
<subunit 1 of 1, 250 aa, 1 stop
<MW: 27466, pI: 8.87, NX(S/T): 4

MRILQLILIALATGLVGGETRIIKGFECKPHSQPWQAALFEKTRLLCGATLIAPRWLLTAAH 
CLKPRYIVHLGQHNLQKEEGCEQTRTATESFPHPGFNNSLPNKDHRNDIMLVKMASPVSITW 
AVRPLTLSSRCVTAGTSCLISGWGSTSSPQLRLPHTLRCANITIIEHQKCENAYPGNITDTM 
VC^VQEGGKDSCQGDSGGPLVCNQSLQGIISWGQDPCAITRKPGVn'KVCKYVDWIQETM^ 

Important features: 
Signal peptide: 

amino acids 1-18 

Serine proteases, trypsin family, histidine active site:
amino acids 58-63 

N-glycosylation sites. 

amino acids 99-102, 165-168, 181-184, 210-213 

Glycosaminoglycan attachment site. 

amino acids 145-148 

Kringle domain proteins. 

amino acids 197-209, 47-64 

Serine proteases, trypsin family, histidine protein 

amino acids 199-209, 47-63, 220-243 

Apple domain proteins 

amino acids 222-249, 189-222 
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FIGURE 103 

GAGCAGTGTTCTGCTGGAGCCGATCCCAAAAACCATGCATTTCTTATTCAGA 
TCTTTTATCTGTGGGGCCTTTTTACTGCTCAGAGACAAAAGAAAGAGGAGAGCACCGAAGAA 
GTGAAAATAGAAGTTTTGCATCGTCCAGAAAACTGCTCTAAGACAAGCAAGAAGGGAGACCT 
ACTAAATGCCCATTATGACGGCTACCTGGCTAAAGACGGCTCGAAATTCTACTGCAGCCGGA 
CACAAAATGAAGGC CACC CC AAATGG TTTG TT CT TGGTGTTGGG CAAGTCATAAAAGGCCTA 
GACATTGCTATGACAGATATGTGC C CTGGAGAAAAG CG AAAAGT AGTTATACCCCCTT CATT 
TGCAT ACGGAAAGGAAGGCT ATGCAG AAGG CAAGATT C CACC GGATGCTACATTGATTTTTG 
AGATTGAACTTTATGCTGTGACCAAAGGACCACGGAGCATTGAGACATTTAAACAAATAG 
ATGGAC AATGACAGGCAG CT CTCTAAAG C CGAGATAAACCTCTACTTGCAAAGGGAATTT GA 
AAAAGATGAGAAGCCACGTGACAAGTCATATCAGGATGCAGTTTTAGAAGATATTTTTAAGA 
AG AATG AC CATGATGGTG ATGG CTTCATTT CT CCCAAGGAAT AC AATG TATACCAACACGAT 

GAACTASAGCATATTTGTATTTCTACTTTTTTTTTTTAGCTATTTACTGTACTTTATGTATA 
AAACAAAGTCACTTTTCTCCAAGTTGTATTTGCTATTTTTCCCCTATGAGAAGATATTTTGA 
TCT C CC CAATACATTGATTTTGG TATAAT AAATGTG AGGCTGTTTTGCAAACTTAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 104

</usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA65406
<subunit 1 of 1, 222 aa, 1 stop
<MW: 25794, pI: 6.24, NX(S/T): 1
MPKTMHFLFRFIVFFYLWGLFTAQRQKKEESTEETO 

YLAKDGSKFYCSRTQNEGHPKWFVLGVGQVIKGLDIAMTDMCPGEKRKVVIPPSFAYGKEGY 
AEGKI P PDATLI FE IELYAVTKGPRS IETFKQIDMDNDRQLSKAE INLYLQREFEKDEKPRD 
KSYQDAVLEDIFKKNDHDGDGFI SPKEYNVYQHDEL 

Important features: 

Endoplasmic reticulum targeting sequence. 

amino acids 219-222 

N-glycosylation site. 

amino acids 45-48 

FKBP-type peptidyl-prolyl cis-trans isomerase

amino acids 87-223, 129-142 

EF-hand calcium-binding domain proteins

amino acids 202-214, 195-214 
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FIGURE 105 

CAGAA4TGCAGGGACCATTGCTTCTTCCAGGCCTCTGCTTTCTGCTGAGCCTCTTTGGAGCT 
GTGACTCAGAAAACCAAAACTTCCTGTGCTAAGTGCCCCCCAAATGCTTCCTGTGTCAATAA 
CACT CACTGCAC CTGC AACCATGGATATAC TT CTGGAT CTGGGCAG AAACTATT CACAT T C C 

CCTTGGAGACATGTAACGCCAGGCATGGTGGCTCGCGCCTGT^TCCCAGTTCTTTGGGAAG 
CC AAGG CAGGTGGATCACCTGAGGT CAGGAGTTTGAGAC GAG CCTG GC CAACAT AGTGAAAC 
CC CGTGTCT ACTAAAAATACAAAAAT CAGC CGGG CGTG GTGGTG CATC C CTG CAAT CCCAGT 
TACTCGGGAGGCTGAGGC AG GAGAAT CG CTTG AACT CAGGAGGC AG AAG TTG CAGTGAAC CC 
AGATCCTG CCATTG CA CT CCAG CATGGATGAC AG AGCAAG ACT C CGTCT CAAAAAGAAAAGA 
T AGT TT CTTGTTTC AT TT CGCG AC TG CC CT CT CAGTGTTT CCTGGG AT C CCCTC CCAAATAA 
AGTACTTATATTCTC 
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FIGURE 106 

MQGPLLLPGLCFLLSLFGAVTQKTKTSCAKCPPNASCVNNTHCTCNHGYTSGSGQKLFTFPL 
ETCNARHGGSRL 



Signal peptide: 

amino acids 1-18 
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FIGURE 107 

CAAGCAGGTCATCCCCTTGGTGACCTTCAAAGAGAAGCAGAGAGGGCAGAGGTGGGGGGCAC 

AGGGAAAGGGTGACCTCTGAGATTCCCCTTTTCCCCCAGACTTTGGAAGTGACCCACCATGG 

GG CTCAGCATCTTTTTGCTCCTGTGTGTTCTTGGGCTCAGCCAGGCAGCCACACCGAA^ 

TTCAATGGCACTGAGTGTGGGCGTAACTCACAGC CGTGGCAGGTGGGG CTGTTTGAGGGCAC 

CAGCCTGCGCTGCGGGGGTGTCCTTATTGACCACAGGTGGGTCCTCACAGCGGCTCACTGCA 

GCGGCAGCAGGTACTGGGTGCGCCTGGGGGAACACAGCCTCAGCCAGCTCGACTGGACCGAG 

CAGATCCGG C ACAGCGG CTT CT CTGTGAC C CATC C CGGCT AC CTGGGAGCCTCGACGAG CCA 

CGAGCACGACCTCCGGCTGCTGCGGCTGCGCCTGCCCGTCCGCGTAACCAGCAGCGTTCAAC 

CCCTGCCCCTGCCCAATGACTGTGCAACCGCTGGCACCGAGTGCCACGTCTCAGGCTGGGGC 

ATCACCAACCACCCACGGAACCCATTCCCGGATCTGCTCCAGTGCCTCAACCTCTCCATCGT 

CTCCCATGCCACCTGCCATGGTGTGTATCCCGGGAGAATCACGAGCAACATGGTGTGTGCAG 

GCGGCGTCCCGGGGCAGGATGCCTGCO^GGGTGATTCTGGGGGCCCCCTGGTGTGTGGGGGA 

GTCCTTCAAGGTCTGGTGTCCTGGGGGTCTGTGGGGCCCTGTGGACAAGATGGCATCCCTGG 

AG TC TACACCTATATTTGCAAGTATGTGGACTGG AT C CGGATG ATCATGAGG AACAACTGAC 

CTGTTTCCTCCACCrCCACCCCCACCCCTTAACTTGGGTACCCCTCTGGCCCTCAGAGCACC 

AATATCTCCTCCATCACTTCCCCTAGCTCCACTCTTGTTGGCCTGGGAACTTCTTGGAACTT 

TAACTC CTG CCAG CCCTT CT AAGAC C CACG AG CGGGGTGAGAGAAGTGTG CAATAGTCTGGA 

ATAAATATAAATGAAGGAGGGGCAAAAAAAAAAAAAA 
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FIGURE 108 

MGLS I FLLLCVLGLSQAATPKI FNGTECGRNSQPWQVGLFEGTSLRCGGVL I DHRWVLTAAH 
CSGSRYW^mLGEHSLSQLDWTEQIRHSGFSVTHPGYLGASTSHEmDLRLLRLRLPVRVTSSV 
QPLPLPNDCATAGTECHVSGWGITNHPRNPFPDLLQCLNLSIVSHATCHGVYPGRITSNMVC 
AGGVPGQDACQGDSGGPLVCGGVLQGLVSWGSVGPCGQDGIPGVYTYICKYVDWIRMIMRNN 

Signal peptide: 

amino acids 1-17 
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FIGURE 109 

GCGGCCACACGCAGCTAGCCGGAGCCCGGACCAGGCGCCTGTGCCTCCTCCTCGTCCCTCGC 
CGCGTCCGCGAAGCCTGGAGCCGGCGGGAGCCCCGCGCTCGCC&2GTCGGGCGAGCTCAGCA 
ACAGGTTCCAAGGAGGGAAGGCGTTCGGCTTGCTCAAAGCCCGGCAGGAGAGGAGGCTGGCC 
GAGATCAACCGGGAGTTTCTGTGTGAQCAGAAGTACAGTGATGAAGAGAACCTTCCAGAAAA 
GCTCACAGCCTTCAAAGAGAAGTACATGGAGTTTGACCTGAACAATGAAGGCGAGATTGACC 
TGATGTCTTTAAAGAGGATGATGGAGAAGCTTGGTGTCCCCAAGACCCACCTGGAGATGAAG 
AAGATGATCTCAGAGGTGACAGGAGGGGTCAGTGACACTATATCCTACCGAGACTTTGTGAA 
CATGATGCTGGGGAAACGGTCGGCTGTCCTCAAGTTAGTCATGATGTTTGAAGGAAAAGCCA 
ACGAGAGCAGCCCCAAGCCAGTTGGCCCCCCTCCAGAGAGAGACATTGCTAGCCTGCCCiga 
GGACCCCGCCTGGACTCCCCAGCCTTCCCACCCCATACCTCCCTCCCGATCTTGCTGCCCTT 
CTTGACACACTGTGATCTCTCTCTCTCTCATTTGTTTGGTCATTGAGGGTTTGTTTGTGTTT 
TCATCAATGTCTTTGTAAAGGACAAATTATCTGCCTTAAAGGGGCTCTGGGTCGGGGAATCC 
TGAGCCTTGGGTCCCCTCCCTCTCTTCTTCCCTCCTTCCCCGCTCCCTGTGCAGAAGGGCTG 
AT AT CAAAC CAAAAACTAGAGGGGG C AGGG C CAGGG CAGGGAGGCTT CCAGCCTGTGTTC CC 
CTCACTTGGAGGAACCAGCACTCTCCATCCTTTCAGAAAGTCTCCAAGCCAAGTfCAGGCTC 
ACTGACCTGGCTCTGACGAGGACCCCAGGCCACTCTGAGAAGACCTTGGAGTAGGGACAAGG 
CTGCAGGGCCTCTTTCGGGTTTCCTTGGACAGTGCCATGGTTCCAGTGCTCTGGTGTCACCC 
AGGACACAGCCACTCGGGGCCCCGCTGCCCCAGCTGATCCCCACTCATTCCACACCTCTTCT 
CAT C CTCAGTGATGTGAAGGTGGGAAGGAAAGG AG CTTGG CATTGGGAGCCCTTCAAGAAGG 
TACCAG AAGG AAC CCTC CAGT C CTG CTCT CTGG C CACACC TGTGCAGG CAGCTGAGAGGC AG 
CGTG CAGC C CTACTGTC C CTTACTGGGG CAGCAG AGGG CTTCGGAGGCAGAAGTGAGGCC TG 
GGGTTTGGGGGGAAAGGTCAGCTCAGTG CTGTT C CACCTTTTAGGGAGGATACTGAGGGG AC 
CAGGATGGGAGAATGAGGAGTAAAATG CT CACGG CAAAGT CAGCAG CACTGGTAAGCCAAGA 
CTGAGAAATACAAGGTTG CTTGT CT GACC CCAAT CTGCTTGAAAAAAAAAAAAAAAAAA 
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FIGURE 110 

MSGELSNRFQGGKAFGLLKARQERRLAE INREFLCDQKYSDEENLPEKLTAFKEKYMEFDLN 

NEGEIDLMSLKRI^EKLGVPKTHLEMKKMISEVTGGVSDTISYRDFTO 

MFEGKANESSPKPVGPPPERDIASLP 
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FIGURE 111A 

CGCGCTCCCCGCGCGCCTCCTCGGGCTCCACGCGTCTTGCCCCGCAGAGGCAGCCTCCTCCA 
GGAGCGGGGCCCTGCACACCATgGCCCCCGGGTGGGCAGGGGTCGGCGCCGCCGTGCGCGCC 
CGCCTGGCGCTGGCCTTGGCGCTGGCGAGCGTCCTGAGTGGGCCTCCAGCCGTCGCCTGCCC 
CACCAAGTGTACCTGCTCCGCTGCCAGCGTGGACTGCCACGGGCTGGGCCTCCGCGCGGTTC 
CTCGGGGCATCCCCCGCAACGCTGAGCGCCTTGACCTGGACAGAAATAATATCACCAGGATC 
ACCAAGATGGACTTCGCTGGGCTCAAGAACCTCCGAGTCTTGCATCTGGAAGACAACCAGGT 
CAGCGTCATCGAGAGAGGCGCCTTCCAGGACCTGAAGCAGCTAGAGCGACTGCGCCTGAACA 
AGAATAAG CTGCAAGT C CTT CC AGAATTGCTT TT C CAG AGCACG CCGAAGCT CACCAGACTA 
GATTTGAGTGAAAACCAGATCCAGGGGATCCCGAGGAAGGCGTTCCGCGGCATCACCGATGT 
GAAGAACCTG CAACTGGACAACAA CCACAT CAGCTG CATTGAAGATGG AGCCTT CCGAGCGC 
TGCGCGATTTGGAGAT CCTTAC CCTCAACAACAACAACATCAGTCGCATCCTGGTCACCAGC 
TTCAACCACATGCCGAAGATCCGAACTCTGCGCCTCCACTCCAACCACCTCTACTGCGACTG 
CCACCTGGCCTGGCTCTCGGATTGGCTGCGACAGCGACGGACAGTTGGCCAGTTCACACTCT 
GCATGGCTCCTGTGCATTTGAGGGGCTTCAACGTGGCGGATGTGCAGAAGAAGGAGTACGTG 
TGCCCAGCCCCCCACTCGGAGCCCCCATCCTGCAATGCCAACTCCATCTCCTGCCCTTCGCC 
CTGC ACGT G C AG CAATAACAT CGTGGACTGT CGAGGAAAGGGCTT GATGG AGATTCCTGC CA 
ACTTGCCG GAGGG CATCGT CGAAATACGC CTAGAAC AGAACT CCAT CAAAGC CATCCCTGCA 
GGAGCCTT CACC CAGTACAAG AAACTGAAG CGAATAGACAT CAG CAAG AATCAG AT AT CGGA 
TATTGCTCCAGATGCCTTCCAGGGCCTGAAATCACTCACATCGCTGGTCCTGTATGGGAACA 
AGATCACCGAGATTGCCAAGGGACTGTTTGATGGGCTGGTGTCCCTACAGCTGCTCCTCCTC 
AATGC CAACAAGATCAACTG CCT G CGGGTGAACACGTTTCAGGAC C TG CAGAAC CTCAACTT 
GCTGTCCCTGTATGACAACAAGCTGCAGACCATCAGCAAGGGGCTCTTCGCCCCTCTGCAGT 
CCATCCAGACACTCCACTTAGCCCAAAACCCATTTGTGTGCGACTGCCACTTGAAGTGGCTG 
GCCGACTAC CTC CAGGACAACC CCAT CGAGA CAAG CGGGG CC CG CTGCAGCAGCC CGCGCCG 
ACTCGCCAACAAGCGCATCAGCCAGATCAAGAGCAAGAAGTTCCGCTGCTCAGGCTCCGAGG 
ATTACCGCAGCAGGTTCAGCAGCGAGTGCTTCATGGACCTCGTGTGCCCCGAGAAGTGTCGC 
TGTGAGGGCACGATTGTGGACTGCTCCAACCAGAAGCTGGTCCGCATCCCAAGCCACCTCCC 
TG AATATGTGACCGAC CTGCGACTGAATGACAATGAGGTAT C TGTT CTGGAGGC CACTGGCA 
TCTTCAAGAAGTTGCCCAACCTGCGGAAAATAAATCTGAGTAACAATAAGATCAAGGAGGTG 
CGAGAGGGAG CTTT CGATGGAGCAGCCAGCGTG CAGGAGCTGAT GCTG ACAGGGAAC CAGCT 
GGAGACCGTGC^CGGGCGCGTGTTCCGTGGCCTCAGTGGCCTCAAAACCTTGATGCTGAGGA 
GTAACTTGAT CAGCTGTGTGAGTAATGACACCTTTG CCGGC CTGAG TT CGGTGAGACTGCTG 
TCCCTCTATGACMTCGGATC^CCACCATCACCCCTGGGGCCTTCACCACGCTTGTCTCCCT 
GTCCACCATAAACCTCCTGTCCAACCCCTTCAACTGCAACTGCCACCTGGCCTGGCTCGGCA 
AGTGGTTGAGGAAGAGGCGGATCGTCAGTGGGAACCCTAGGTGCCAGAAG CCATTTTTCCT C 
AAGGAGATTCCCATCCAGGATGTGGCCATCCAGG ACTTCACCTGTGATGG CAAC GAGGAGAG 
TAGCTGCCAGCTGAGCCCGCGCTGCCCGGAGCAGTGCACCTGTATGGAGACAGTGGTGCGAT 
GCAG CAACAAGG GGCT CC GCG CC CT CCCCAGAGG CATGCC CAAGGATGTG AC CGAGCTGTAC 
CTGGAAGGAAACCACCTAACAGCCGTGCCCAGAGAGCTGTCCGCCCTCCGACACCTGACGCT 
TATTGACCTGAGCAACAACAGCATCAGCATGCTGACCAATTACACCTTCAGTAACATGTCTC 
ACCTCTCCACTCTGATCCTGAGCTACAACCGGCTGAGGTGCATCCCCGTCCACGCCTTCAAC 
GGGCTGCGGTCCCTGCGAGTGCTAACCCTCCATGGCAATGACATTTCCAGCGTTCCTGAAGG 
CTCCTTCAACGACCTCACATCTCTTTCCCATCTGGCGCTGGGAACCAACCCACTCCACTGTG 
ACTGCAGTCTTCGGTGGCTGTCGGAGTGGGTGAAGGCGGGGTACAAGGAGCCTGGCATCGCC 
CGCTGCAGTAGCCCTGAGCCCATGGCTGACAGGCTCCTGCTCACCACCCCAACCCACCGCTT 
CCAGTGCAAAGGGCCAGTGGACATCAACATTGTGGCCAAATGCAATGCCTGCCTCTCCAGCC 
CGTGCAAGAATAACGGGACATGCACCCAGGACCCTGTGGAGCTGTACCGCTGTGCCTGCCCC 
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FIGURE 111B 

TACAGC TACAAGGGCAAGGACTGCACTGTGCC CATCAACACC TGCATC CAG AAC C C CT GT C A 
GCATGGAGGCACCTGCCACCTGAGTGACAGCCACAAGGATGGGTTCAGCTGCTCCTGCCCTC 
TGGG CTTTGAGGGG CAGCGGTGTGAGATCAACC CAGATGACTGTGAGG ACAACG AC TG CGAA 
AACAATGC CAC CTGCGTGGACGGGATCAACAACTACGTGTGTATCTGTCCG CCTAACTACAC 
AGGT GAG C TATGCGACGAGGTG ATTGAC CACTGTGTGCCTGAGCTGAACCT CTGTC AG CATG 
AGGCCAAGTGCATCCCCCTGGACAAAGGATTCAGCTGCGAGTGTGTCCCTGGCTACAGCGGG 
AAGCTCTGTGAGACAGAC7UVTGATGACTGTGTGGCCCACAAGTGCCGCCACGGGGCCCAGTG 
CGTGGACACAATCAATGGCTACACATGCACCTGCCCCCAGGGCTTCAGTGGACCCTTCTGTG 
AACACCCCCCACCCATGGTCCTACTGCAGACCAGCCCATGCGACCAGTACGAGTGCCAGAAC 
GGGGCCCAGTGCATCGTGGTGCAGCAGGAGCCCACCTGCCGCTGCCCACCAGGCTTCGCCGG 
CCCCAGATGCGAGAAGCTCATCACTGTCAACTTCGTGGGCAAAGACTCCTACGTGGAACTGG 
CCTCCGCCAAGGTCCGACCCCAGGCCAACATCTCCCTGCAGGTGGCCACTGACAAGGACAAC 
GGCATC CTTCTCTACAAAGGAGAC AATGAC CC C CTGG CACTGGAGCTGT ACCAGGG CCACGT 
GCGGCTGGTCTATGACAGCCTGAGTT CCCCTC CAACCACAGTGTACAGTGTGGAGACAGTGA 
ATGATGGGCAGTTTCACAGTGTGGAGCTGGTGACGCTAAACCAGACCCTGAACCl'AGTAGTG 
GACAAAGGAACT C CAAAG AG CCTGGGGAAGCT CCAGAAG CAG CCAGCAGTGGG CAT CAACAG 
CCCCCTCTACCTTGGAGGC^TCCCCACCTCCACCGGCCTCTCCGCCTTGCGCCAGGGCACGG 
AC CGGC CT CTAGGCGG CTT C CACGGATGCATCCATGAGGTGCG CAT CAACAACG AG CTGCAG 
GACTTCAAGGCCCTCCCACCACAGTCCCTGGGGGTGTCACCAGGCTGCAAGTCCTGCACCGT 
GTGCAAGCACGGCCTGTGCCGCTCCGTGGAGAAGGACAGCGTGGTGTGCGAGTGCCGCCCAG 
GCTGGACCGGCCCACTCTGCGACCAGGAGGCCCGGGACCCCTGCCTCGGCCACAGATGCCAC 
CATGGAAAATGTGTGGCAACTGGGACCTCATACATGTGCAAGTGTGCCGAGGGCTATGGAGG 
GGACTTGTGTGACAACAAGAATGACT CT GC CAATGC CTGC TCAG C CTTCAAGTGTCAC CATG 
GGCAGTGCCACATCTCAGACCAAGGGGAGCCCTACTGCCTGTGCCAGCCCGGCTTTAGCGGC 
GAGCACTGCCAACAAGAGAATCCGTGCCTGGGAC AAGT AGT C CGAGAGGTGAT CCGCCGCCA 
GAAAGGTTATGCATCATGTGCC AC AG CCTC CAAGGTGC CCAT CATGGAATGT CGTGGGGGCT 
GTGGGCCCCAGTGCTGCCAGCCCACCCGCAGCAAGCGGCGGAAATACGTCTTCCAGTGCACG 
GACGGCTCCTCGTTTGTAGAAGAGGTGGAGAGACACTTAGAGTGCGGCTGCCTCGCGTGTTC 
CTAAGCCCCTGCCCGCCTGCCTGCCACCTCTCGGACTCCAGCTTGATGGAGTTGGGACAGCC 
ATGTGGGACCCCCTGGTGATTCAGCATGAAGGAAATGAAGCTGGAGAGGAAGGTAAAGAAGA 

AGAGAATATTAAGTATATTGTAAAATAAACAAAAAATAGAACTTAAAAAAAAAAAAAAAAAA 
AAAAAA 



WO 00/12708 



PCT/US99/20111 



FIGURE 112 

MAPGWAGVGAAVRAIUJUJU^^ 
AERLDLDRNNITRITKMDFAGLKNLRVL 

PELLFQSTPKLTRLDLSENQIQGIPRKAFRGITDVKNLQLDNNHISCIEDGAFRALRDLEIL 

TLNNNNISRILVTSFNHMPKIRTLRLHSNHLYCDCHLiAWLSDWI^QRRTV 

RGFNVADVQKKEYVCPAPHSEPPSCNi^SISCPSPCTCSNNIVDCRGKGLMEIPANLPEGIV 

EIRLEQNSIKAIPAGAFTQYKKLKRIDISKNQISDIAPDAFQGLKSLTSLVLYGNKITEIAK 

GLFDGLVSLQLLLLNANKINCLRVNTFQDLQNLNLLSLYDNKLCTISKGLFAPLQSIQTLHL 

AQNPFVCDCHLKWLADYLQDNPIETSGARCSSPRRIANKRISQIKSKKFRCSGSEDYRSR 

SECFMDLVCPEKCRCEGT IVDCSNQKLVRI PSHLPEYVTDLRLNDNEVS VLEATG I FKKLPN 

LRKINLSm^IKEVREGAFDGAASVQELMLTGNQLETVHGRVFRGLSGLKTLML^SmiSCV 

SND T F AGL S S VRLLSL YDNR I TT I T PGAFTTL VS LS T I NLLSNP FNCN CHLAWLGKWLRKRR 

IVSGNPRCQKPFFLKEIPIQDVAIQDFTCDGNEESSCQLSPRCPEQCTCMETWRCSNKGLR 

ALPRGMPKDVTELYLEGNHLTAVPRELSALRHLTLIDLSNNSISMLTNYTFSNMSHLSTLIL 

SYNRLRCI PVHAFNGLRSLRVLTLHGND I SS VPEGS FNDLTSLSHLALGTNPLHCDCSLiRWL 

SEWVKAGYKEPGIARCSSPEPMADRLLLTTPTHRFQCKGPVDINIVAKCNACLSSPCKNNGT 

CTQDPVELYRCACPYSYKGKDCTVPINTCIQNPCQHGGTCHLSDSHKDGFSCSCPLGFEGQR 

CEINPDDCEDNDCENNATCVDGINNYVCICPPNYTGELCDEVIDHCVPELNLCQHEAKCIPL 

DKGFSCECVPGYSGKLCETDNDDCVAHKCRHGAQCVDTINGYTCTCPQGFSGPFCEHPPPMV 

LLQTSPCDQYECQNGAQCIWQQEPTCRCPPGFAGPRCEKLITVNFVGKDSYVELASAKVRP 

QANISLQVATDKDNGIIJ^YKGDNDPLALELYQGHVRLVYDSLSSPPTTVYSVET^ 

VELVTLNQTLNLWDKGTPKSLGKLQKQPAVG INSPLYLGGI PTSTGLSALRQGTDRPLGGF 

HGC I H E VR I NNELQD FKAL P PQS LGVS F GC KS CT VC KHGL CRS VE KD S WCE CR PG WTG P LC 

DQEARDPCLGHRCHHGKCVATGTSYMCKCAEGYGGDLCDNKNDSANACSAFKCHHGQCHISD 

QGEPYCLCQPGFSGEHCQQENPCLGQWREVIRRQKGYASCATASKVP IMECRGGCGPQCCQ 

PTRS KRRKYVFQCTDGS S FVEE VERHLECGCLACS 

Signal peptide: 

amino acids 1-27 
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FIGURE 113 

GGATGCAGGACGCTCCCCTGAGCTGCCTGTCACCGACTAGGTGGAGCAGTGTTTCTTCCGCA 
GACTCAACTGAGAAGTCAGCCTCTGGGGCAGG CACCAGGAAT CTGC CTTTTCAGTTCTGTCT 
CCGGCAGGCTTTGAGGA^AAGGCTGCGGGCATTCTGACCCTCATTGGCTGCCTGGTCACAG 
GCG CCGAGTCCAAAATCTACAC TCGTTG CAAACTGG CAAAAATATT CT CG AGGG CTGG CCTG 
GACAATTACTGGGGCTTCAGCCTTGGAAACTGGATCTGCATGGCATATTATGAGAGCGGCTA 
CAACACCACAG C C CCGACGGTC CTGGATGACGG CAG C ATCGACTATGG CATCTTCCAGATCA 
ACAGCTTCGCGTGGTGCAGACGCGGAAAGCTGAAGGAGAACAACCACTGCCATGTCGCCTGC 
TCAGCCTTGATCACTGATGACCTCACAGATGCAATTATCTGTGCCAGGAAAATTGTTAAAGA 
GA CACAAGGAATG AACT ATTGG CAAGGCT GGAAGAAACATTGTG AGGGCAGAGA CC TG T C CG 
AGTGGAAAAAAGGCTGTGAGGTTTCCTAAACTGGAACTGGACCCAGGATGCTTTGCAGCAAC 
G C C CT AGG ATTTG C AGTG AATGT C CAAAT G C CTGTGT CATCTTGTC C CGTTT CC TC CCAAT A 
TT C CTTCT CAAAC TTGGAGAGGGAAAATTAAGCTATACTTTTAAGAAAATAAAT ATTTC CAT 
TTAAATGTC 
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FIGURE 114 

MKAAGILTLIGCLVTGAESKIYTRCKIAK 

TVLDDGS IDYGI FQ INSFAWCRRGKLKENNHCHVACSAL I TDDLTDAI I CARKI VKETQGMN 
YWQGWKKHCEGRDLSEWKKGCEVS 

Signal peptide: 

amino acids 1-19 



/XT/* 7£> 



WO 00/12708 



PCT/US99/20111 



FIGURE 115 

CAGGCCATTTGCATCCCACTGTCCTTGTGTTCGGAGCCAGGCCACACCGTCCTCAGCAGTGT 
CATG TGTTAAAAACGC CAAGCTGAATATAT CATGC C CCTATTAAAA CTTGTACATGGC TC CC 
CATTGGTTTTTGGAGAAAAGTTCAAGCTTTTTACCTTGGTGTCTGCCTGTATCCCAGTGTTC 
AGGCTGGCTAGACGGCGGAAGAAGATCCTATTTTACTGTCACTTCCCAGATCTGCTTCTCAC 
CAAGAGAGATTCTTTTCTTAAACGACTATACAGGGCCCCAATTGACTGGATAGAGGAATACA 
CCACAGGCATGG CAGACTG C AT CTTAGT C AACAGCCAG TT CACAG CTG CTGTTTTTAAGGAA 
ACATT C AAGT CCCTGTCTCACATAGACC CTGATGT C CT CTATCCAT CTCTAAATGT CAC CAG 
CTTTGACTCAGTTGTTCCTGAAAAGCTGGATGACCTAGTCCCCAAGGGGAAAAAATTCCTGC 
TGCT CT CC AT C AAC AG ATACGAAAGG AAGAAAAAT CTG ACTTTGGC AC TGGAAG CC CTAGTA 

CAGCTGCGTGGAAGATTGACATCCCAAGATTGGGAGAGGGTTCATCTGATCGTGGCAGGTGG 

TTATGACGAGAGAGTCCTGGAGAATGTGGAACATTATCAGGAATTGAAGAAAATGGTCCAAC 

AGTCCGACCTTGGCCAGTATGTGACCTTCTTGAGGTCTTTCTCAGACAAACAGAAAATCTCC 

CTCCTCCACAGCTGCACGTGTGTGCTTTACACACCAAGCAATGAGCACTTTGGCATTC 

T CTGGAAGCCATGTACATG CAGTGCC CAGT CATTGCTGTT AATTC GGGTG GACC CTTGGAGT 

CCATTGACCACAGTGTCACAGGGTTTCTGTGTGAGCCTGACCCGGTGCACTTCTCAGAAGCA 

ATAGAAAAGTTCAT C CGTGAACCTTC CTTAAAAG CC AC CATGGG CC TGGCTGGAAGAGCCAG 

AGTGAAGGAAAAATTTTCCC CTGAAG CATTTACAGAACAG CT CT ACCGATAT GTTACCAAAC 

TGCTGGTAS&ATCAGATTGTTTTTAAGATCTCCATTAATGTCATTTTTATGGATTGTAGACC 

CAGTTTTGAAACCAAAAAAGAAACCTAGAATCTAATGCAGAAGAGATCTTTTAAAAAATAAA 

CTTGAGTCTTGAATGTGAGCCACTTTCCTATATACCACACCTCCCTGTCCACTTTTCAGAAA 

AACCATGT CTTTTATG CTATAATCATTC CAAATTTTGCCAGTGTTAAGTTACAAATGTGGTG 

TCATT CCATGTT CAGCAGAGTATTTT AATTATATTTT CTCGGGAT TATTG CT CT TCTGT CTA 

TAAATTTTGAATGATACTGTGCCTTAATTGGTTTTCATAGTTTAAGTGTGTATCATTATCAA 
AGTTGATTAATT TGGCTTCATAGT ATAATGAGAGCAGG GCTATTGT AGTT C C CAGATT CAAT 
CCACCGAAGTGTTCACTGTCATCTGTTAGGGAATTTTTGTTTGTCCTGTCTTTGCCTGGATC 
CATAGCGAGAGTGCTCTGTATTTTTTTTAAGATAATTT GT ATTT TTGC AC ACTG AGATATAA 
TAAAAGGTGTTTATCATAAAAAAAAAAAAAAAAAAA 
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FIGURE 116 

M PLLKli VHGS PL VFGE KF KLF TLVS AC I P V FRLARRRKKI L FYCHF PDLLLTKRDS FLKRL Y 

RAPIDWIEEYTTGMADCILVNSQFTAAVFKETFKSLSHIDPDVLYPSLNVTSFDSWPEKLD 

DLVPKGKKFLLLSINRYERKKIJLTIJU^ALVQLRGRLTSQDWERVHLIVAGGYDERVI^ 

HYQELKKMVQQSDLGQYVTFLRSFSDKQKISLLHSCTCVLYTPSNEHFGIVPLEAMYMQCPV 

IAVNSGGPLESIDHSVTGFLCEPDPVHFSEAIEKFIREPSLKATMGLAGRARVKEKFSPEAF 
TEQLYRYVTKLLV 

Signal peptide: 

amino acids 1-15 
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FIGURE 117 

GACTACGCCGATCCGAGACGTGGCTCCCTGGGCGGCAGAACCATGTTGGACTTCGCGATCTT 
CGCCGTTACCTTCTTGCTGGCGTTGGTGGGAGCCGTGCTCTACCTCTATCCGGCTTCCAGAC 
AAG C TG CAGG AAT T C CAGGG ATTACT C C AACT G AAG AAAAAG ATGG T AAT CT TC C AGATATT 
GTGAATAGTGG AAGTTTG CATGAGTT C CTGGTTAATTTGC ATGAGAGATATGGG CCTGTGGT 
CTCCTTCTGGTTTGGCAGGCGCCTCGTGGTTAGTTTGGGCACTGTTGATGTACTGAAGCAGC 
ATATCAATCC CAATAAGAC ATCGGAC CC TTTTGAAACCATGCTGAAGTCATTATTAAGGTAT 
CAATCTGGTGGTGGCAGTGTGAGTGAAAACCACATGAGGAAAAAATTGTATGAAAATGGTGT 
GACTGATT CT CTGAAG AGTAACTTTG CC CT C CT C CT AAAG CTTTCAGAAGAATTATTAGATA 
AATGGCTCTCCTACCCAGAGACCCAGCACGTGCCCCTCAGCCAGCATATGCTTGGTTTTGCT 
ATGAAGTCTGTTACACAGATGGTAATGGGTAGTACATTTGAAGATGATCAGGAACTCATTCG 
C TT CCAGAAG AAT C AT GGC A CAGTTTGGTCTG AG ATTGGAAAAGGCTTTCTAGATGGGTCAC 
TTGATAAAAACATGACT CGGAAAAAACAATATGAAGATGC CCTCATGC AACTGGAGTCTGTT 
T T AAGG AACAT CAT AAAAG AAC G AAAAGG AAGG AACTT C AG T CAACAT ATTT TC AT TG ACT C 
C TT AGT ACAAG GGAAC CTT AATGA C C AACAGAT C CTAGAAGA CAG T ATGATATT TT CT CT GG 
CCAGTTGCATAATAACTG CAAAATTGTG TACCTGGGCAAT CTGTTTTTTAAC CACCTCTGAA 
GAAGTTCAAAAAAAATTATATGAAGAGATAAACCAAGTTTTTGGAAATGGTCCTGTTACTCC 
AGAGAAAATTGAGCAG CT CAGATATTGT CAGCATGTGCTTTGTGAAACTGTT CGAACTG CCA 
AACTGACT CCAGTTTCTGCC CAGCTTCAAGATATTGAAGGAAAAATTGACCGATTTATTATT 
CCTAGAGAGACCCTCGTCCTTTATGCCCTTGGTGTGGTACTTCAGGATCCTAATACTTGGCC 
AT CTCCACACAAGTTTGATC CAGATC GGTTTGATGATGAATTAGTAATGAAAACTTT TTCC T 
CACTTGGATT CTCAGG CACACAGGAGTGT C CAGAGTTGAGGTTTGCATAT AT GGTGAC CACA 
GTACTTCTTAGTGTATTGGTGAAGAGACTGCACCTACTTTCTGTGGAGGGACAGGTTATTGA 
AACAAAGTATGAACTGGTAACATCATCAAGGGAAGAAGCTTGGATCACTGTCTCAAAGAGAT 
ATTMAATTTTATACATTTAAAATC^TTGTTAAATTGATTGAGGAAAACAACCATTTAAAAA 
AAATCTATGTT GAAT CCTTTTATAAAC CAGTATC ACTTTGTAATAT AAACAC CTATTTGTAC 
TTAA 
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FIGURE 118 

MLDFAIFAVTFLLALVGAVLYLYPASRQAAGIPGITPTEEKDGNLPDIVNSGSLHEFLVNLH 
ERYGPWSFWFGRRLWSLGTVDVLKQHINPNKTSDPFETMLKSLLRYQSGGGSVSENHMRK 
KLYENGVTDSLKSNFALLLKLSEELLDKWLSYPETQHVPLSQHMLGFAMKSVTQMVMGSTFE 
DDQEVIRFQKNHGTWSEIGKGFLDGSLDKNMTRKKQYEDALMQLESVLRNIIKERKGRNFS 
QHIFIDSLVQGNLNDQQILEDSMIFSLASCIITAKLCTWAICFLTTSEEVQKKLYEEINQVF 
GNGPVTPEKIEQLRYCQHVLCETV^TAKLTPVSAQLQDIEGKIDRFIIPRETLVLYALGVVL 
QDPNTWPSPHKFDPDRFDDELVMKTFSSIXSFSGTQECPEIJIFAYI^TVLLSVLVKRLHLLS 
VEGQ V I E TKYEL VTS S RE EAW I TVS KR Y 

Signal peptide: 

amino acids 1-18 

Transmembrane domain: 

amino acids 271-290 
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FIGURE 119 

CTAGATTTGTCGGCTTGCGGGGAGACTTCAGGAGTCGCTGTCTCTGAACTTCCAGCCTCAGA 
GACCGCCGCCCTTGTCCCCGAGGGCCATGGGCCGGGTCTCAGGGCTTGTGCCCTCTCGCTTC 
CTGACGCTCCTGGCGCATCTGGTGGTCGTCATCACCTTATTCTGGTCCCGGGACAGCAACAT 
ACAGGCCTGCCTGCCTCTCACGTTCACCCCCGAGGAGTATGACAAGCAGGACATTCAGCTGG 
TGGCCGCGCTCTCTGTCACCCTGGGCCTCTTTGCAGTGGAGCTGGCCGGTTTCCTCTCAGGA 
GTCTCCATGTTCAACAGCACCCAGAGCCTCATCTCCATTGGGGCTCACTGTAGTGCATCCGT 
GGCCCTGTCCTTCTTCATATTCGAGCGTTGGGAGTGCACTACGTATTGGTACATTTTTGTCT 
TCTGCAGTGCCCTTCCAGCTGTCACTGAAATGGCTTTATTCGTCACCGTCTTTGGGCTGAAA 
AAGAAACCCTTCTGATTAC CTTCATGACGGGAACCT AAGGACGAAGC CTACAGGGGCAAGGG 
CCGCTTCGTATTCCTGGAAGAAGGAAGGCATAGGCTTCGGTTTTCCCCTCGGAAACTGCTTC. 
TGCTGGAGGATATGTGTTGGAATAATTACGTCTTGAGTCTGGGATTATCCGCATTGTATTTA 
GTGCTTTGTAATAAAATATGTTTTGTAGTAACATTAAGACTTATATACAGTTTTAGGGGACA 
ATTAAAAAAAAAAAA 
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FIGURE 120 

MGRVSGLVPSRFLTLLAHLVWITLFWSRDSNIQACLPLTFTPEEYDKQDIQLVAALSVTLG 
LFAVELAGFLSGVSMFNSTQSL I S IGAHCS AS VALS FF I FERWE CTTYWY I FVF CSALPAVT 
EMALFVTVFGLKKKPF 

Transmembrane domain: 

amino acids 12-28 (type II), 51-66, 107-124 
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FIGURE 121 

TCCCGGACCCTGCCGCCCTGCCACT&2GTCCCGCCGCTCTATGCTGCTTGCCTGGGCTCTCC 
C CAGCCT C CT TCGACT CGGAGCGGCTCAGGAGACAGAAGACC CGGC CTGCT G CAG C CC CATA 
GTGCCCCGGAACGAGTGGAAGGCCCTGGCATCAGAGTGCGCCCAGCACCTGAGCCTGCCCTT 
ACGCTATGTGGTGGTATCGCACACGGCGGGCAGCAGCTGCAACACCCCCGCCTCGTGCCAGC 
AGCAGGCCCGGAATGTGCAG CACT ACCACATGAAGACACTGGGCTGGTG CGACGTGGGCTAC 
AACTTCCTGATTGGAGAAGACGGGCTCGTATACGAGGGCCGTGGCTGGAACTTCACGGGTGC 
CCACTCAGGTCACTTATGGAACCCCATGTCCATTGGCATCAGCTTCATGGGCAACTACATGG 
AT CGGGTG C C CACACC C CAGGC CAT C CGGGC AG C C CAGGGT CTACTGGC CTGCGGTGTGGCT 

CAGGGAGCCCTGAGGTCCAACTATGTGCTCAAAGGACACCGGGATGTGCAGCGTACACTCTC 
TCCAGGCAACCAGCTCTACCACCTCATCCAGAATTGGCCA 

CTGCTGATCCGCACCCCATTCCTCCCCTCCCATGGCCAAAAACCCCACTGTCTCCTTCTCCA 
ATAAAGATGTAGCTC 
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FIGURE 122 

MSRRSMLLAWALPSLLRLGAAQETEDPACCSPIVPRNEWKALASECAQHLSLPLRYVVVSHT 
AGSSCNTPASCQQQARNVQHYHMKTLGWCDVGYNFLIGEDGLVYEGRGWNFTGAHSGHLWNP 

MS IGI SFMGrTYMDRVPTPQAIRAAQGLLACGVAQGAL^^ 
IQNWPHYRSP 

Signal peptide: 

amino acids 1-20 



/23 



WO 00/12708 



PCT/US99/20111 



FIGURE 123 

CTGGGACCCCGAAAAGAGAAGGGGAGAGCGAGGGGACGAGAGCGGAGGAGGAAGATGCAACT 
GACTCGCTGCTGCTTCGTGTTCCTGGTGCAGGGTAGCCTCTATCTGGTCATCTGTGGCCAGG 
ATGATGGTCCTCCCGGCTCAGAGGACCCTGAGCGTGATGACCACGAGGGCCAGCCCCGGCCC 
CGGGTGCCTCGGAAGCGGGGCCACATCTCACCTAAGTCCCGCCCCATGGCCAATTCCACTCT 
CCTAGGGCTGCTGGCCCCGCCTGGGGAGGCTTGGGGCATTCTTGGGCAGCCCCCCAACCGCC 
CGAACC ACAG CC CC C CACC CTCAGC CAAGGTGAAGAAAAT CTTTGG CTGGGGCGACTTCTAC 
TCCAACATCAAGACGGTGGCCCTGAAGCTGCTCGTCACAGGGAAGATTGTGGACCATGGCAA 
TGGGACCTTCAG CGTCCACTTC CAACACAATGCCACAGGC CAGGGAAACATCTCCATCAGCC 
TCGTGCCC C C CAGT AAAG CTGT AG AGTT CCAC CAGGAAC AGCAGAT CTT CATCGAAGCCAAG 
GCCTCCAAAATCTTCAACTGCCGGATGGAGTGGGAGAAGGTAGAACGGGGCCGCCGGACCTC 
G CTT TG CAC C CACGACCCAGCCAAGATCTG CT CCCGAGACCACG CT CAG AG CT CAG CCAC CT 
GGAG CTGCTCC CAG CC CTTCAAAGTCG T CTGTGT CTACATCG CCTTCTACAGCACGGAC TAT 
CGGCTGGT C CAGAAGGTGTGCC CAG ATTACAACTAC CATAGT GAT ACCCC CT ACT ACC CATC 
TGGGTGACCCGGGGCAGGCCACAGAGGCCAGGCCAGGGCTGGAAGGACAGGCCTGCCCATGC 
AGGAGACCATCTGGACACCGGGCAGGGAAGGGGTTGGGCCTCAGGCAGGGAGGGGGGTGGAG 
ACGAGGAGATGCCAAGTGGGGCCAGGGCCAAGTCTCAAGTGGCAGAGAAAGGGTCCCAAGTG 
CTGGTCCCAACCTGAAGCTGTGGAGTGACTAGATCACAGGAGCACTGGAGGAGGAGTGGGCT 
CTCTGTGC^GCCTCACAGGGCTTTGCCACGGAGCCACAGAGAGATGCTGGGTCCCCGAGGCC 
TGTGGG CAGGC CGATC AGTGTGGC C CCAGATCAAGTCATGGG AGGAAG CTAAGC CCTTGGTT 
CTTG CC AT CCTGAG GAAAGATAGCAACAGGGAGGGGGAGATTT CATCAG TGTGGACAGCCTG 
TCAACTTAGGATGGATGGCTGAGAGGGCTTCCTAGGAGCCAGTCAGCAGGGTGGGGTGGGGC 
CAGAGGAGCTCTCCAGCCCTGCCTAGTGGGCGCCCTGAGCCCCTTGTCGTGTGCTGAGCATG 
GCATGAGGCTGAAGTGGCAACCCTGGGGTCTTTGATGTCTTGACAGATTGACCATCTGTCTC 
CAGCCAGGCCACCCCTTTCCAAAATTCCCTCTTCTGCCAGTACTCCCCCTGTACCACCCATT 
GCTG ATGG CACACCCAT CCTTAAG CTAAGACAGG ACGATTGT GGT C CTCC C ACACTAAGG CC 
ACAGCCCATCCGCGTGCTGTGTGTCCCTCTTCCACCCCAACCCCTGCTGGCTCCTCTGGGAG 
CATC CATGTCCCGGAGAGGGGTCCCTCAACAGTCAGCCTCACCTGTCAGACCGGGGTT CTCC 
CGGATCTGGATGGCGCCGCCCTCTCAGCAGCGGGCACGGGTGGGGCGGGGCCGGGCCGCAGA 
GCATGTGCTGGATCTGTTCTGTGTGTCTGTCTGTGGGTGGGGGGAGGGGAGGGAAGTCTTGT 

GAAACCGCTGATTGCTGACTTTTGTGTGAAGAATCGTGTTCTTGGAGCAGGAAATAAAGCTT 
GCCCCGGGGCA 
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FIGURE 124 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA66521 
><subunit 1 of 1, 252 aa, 1 stop 
><MW: 28127, pI: 8.91, NX(S/T): 5 

MQLTRCCFVFLVQGSLYLVICGQDDGPPGSEDPERDDHEGQPRPRVPRKRGHISPKSRPMAN 
STLLGLIAPPGEAWGILGQPPNRPNHSPPPSAKVKKIFGWGDFYSNIKTVALNLLVTGKIVD 
HGNGTFSVHFQHNATGQGNISISLVPPSKAVEFHQEQQIFIEAKASKIFNCRMEWEKVERGR 
RTSLCTHDPAKICSRDHAQSSATWSCSQPFKWCVYIAFYSTDYRLVQKVCPDYNYHSDTPY 
YPSG 

Important features of the protein: 
Signal peptide: 
amino acids 1-14 

N-glycosylation sites. 

amino acids 62-65, 127-130, 137-140, 143-146 

2-oxo acid dehydrogenases acyltransferase 
amino acids 61-71 
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FIGURE 125 



GTGAATGTGAGGGTTTGATGACTTT CAG ATGTCTAGGAAC CAGAGTGGGTGCAGGGGC CCCA 
GGCAGGGCTGATTCTTGGGCGGAGGAGAGTAGGGTAAAGGGTTCTGCATGAGCTCCTTAAAG 
GACAAAGGTAACAGAG CCAG CG AG AG AG CT CGAGGGGAG ACTTTGACTTCAAGC CACAGAAT 
TGGTGGAAGTGTGCGCGCCGCCGCCGCCGTCGCTCCTGCAGCGCTGTCGACCTAGCCGCTAG 
CATCTTCCCGAGCACCGGGATCCCGGGGTAGGAGGCGACGCGGGCGAGCACCAGCGCCAGCC 
GGCTGCGGCTGCCCACACGGCTCACCATGGGCTCCGGGCGCCGGGCGCTGTCCGCGGTGCCG 
GCCGTGCTGCTGGTCCTCACGCTGCCGGGGCTGCCCGTCTGGGCACAGAACGACACGGAGCC 
CATCGTGCTGGAGGGCAAGTGTCTGGTGGTGTGCGACTCGAACCCGGCCACGGACTCCAAGG 
GCTCCTCTTCCTCCCCGCTGGGGATATCGGTCCGGGCGGCCAACTCCAAGGTCGCCTTCTCG 
GCGGTGCGGAGCAC CAAC CA CG AG CCAT CCGAGATGAG CAACAAGACGCGCATCATTTACTT 
CGATCAGATCCTGGTGAATGTGGGTAATTTTTTCACATTGGAGTCTGTCTTTGTAGCACCAA 
GAAAAG GAATTTAC AGTTT C AGTTTT CACGTGATTAAAGTCTAC CAGAGCCAAACTAT CCAG 
GTTAACTTGATGTTAAATGGAAAACCAGTAATATCTGCCTTTGCGGGGGACAAAGATGTTAC 
TCGTGAAGCTGCC^CGAATGGTGTCCTGCTCTACCTAGATAAAGAGC^TAAGGTTTACCTAA 
AACTGGAGAAAGGTAATTTGGTTGGAGGCTGGCAGTATTCCACGTTTTCTGGCTTTCTGGTG 
TTCCCCCTASASGATTCAATTTCTCCATGATGTTCATCCAGGTGAGGGATGACCCACTCCTG 
AGTTATTGGAAGAT CATTTTTTCATCAT TGGATTGATGTCTTTT ATTG GTTTCTCATG GGTG 
GAT ATGGATT CT AAGGATTCTAGCCTGT CTGAAC CAATACAAAATTTCACAGATT ATTTGTG 
TGTGTCTGTTT CAGTAT ATTTGGATTGGGACTCTAAGC AG ATAATACCTATG CTTAAATGTA 
ACAGTCAAAAG CTGT CTGCAAGACTTATT CTG AATTTCATTT CCTG GG ATTACTGAATTAGT 
TACAGATGTGGAATTTTATTTGTTTAGTTTTAAAAGACTGGCAACCAGGTCTAAGGATTAGA 
AAACTCTAAAGTTCTGACTTCAAT CAACGG TT AGTGTGAT AC TGCCAAAGAACTGTATACTG 
TGTTAATATATTGATTATATTTGTTTTTATTCCTTTGGAATTAGTTTGTTTGGTTCTTGTAA 
AAAACTTGGATTTTTTTTTTCAGTAACTGGTATTATGTTTTCTCTTAAAATAAGGTAATGAA 
TGGCTTGCCCACAAATTTACCTTGACTACGATATCATCGACATGACTTCTCTCAAAAAAAAA 
GAATGCTTCATAGTTGTATTTTAATTGTATATGTGAAAGAGTCATATTTTCCAAGTTATATT 
TT CTAAGAAG AAG AAT AG AT CATAAATCTG ACAAGGAAAAAG TTGCTTAC CCAAAAT CTAAG 
TGCTCAATCCCTGAGCCTCAGCAAAACAGCTCCCCTCCGAGGGAAATCTTATACTTTATTGC 
TCAACTTTAATTAAAATGATTGATAATAACCACTTTATTAAAAACCTAAGGTTTTTTTTTTT 
T C CG TAGACATGAC CACT TT ATT AACTGGTGGTGGGATGCTGTTGTTT CTAATT ATACCTAT 
TTTTCAAGGCTTCTGTTGTATTTGAAGTATCATCTGGTTTTGCCTTAACTCTTTAAATTGTA 
TATATTTATCTGTTTAGCTAATATTAAATTCAAATATCCCATATCTAAATTTAGTGCAATAT 
CTTGTCTTTTGTATAGGTCATATGAATTCATAAAATTATTTATGTCTGTTATAGAATAAAGA 
TTAATATATGTTAAAAAAA 
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FIGURE 126 

MGSGRRALS AVPAVLLVLTLPGLP VWAQNDTE P I VLEGKCLWCDSNP ATDS KGS S S S PLG I 

SVRAANSKVAFSAVRSTNHEPSEMSNKTRI I YFDQI LVNVGNFFTLESVFVAPRKG I YS FS F 

HVIKVYQSQTIQVNLMLNGKPVISAFAGDKDVTO 

GWQYSTFSGFLVFPL 

Signal peptide: 

amino acids 1-27 
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FIGURE 127 

CGGTGGCCA^ACTGCGGCCGTGTTCTTCGGCTGCGCCTTCATTGCCTTCGGGCCTGCGCTC 
GCCCTTTATGTCTTCACCATCGCCATCGAGCCGTTGCGTATCATCTTCCTCATCGCCGGAGC 
TTTCTTCTGGTTGGTGTCTCTACTGATTTCGTCCCTTGTTTGGTTCATGGCAAGAGTCATTA 
TTGACyUVCAAAGATGGACC^VACACAGAAATATCTGCTGATCTTTGGAGCGTTTGTCTCTGT 
TATAT CCAAGAAATGTT C CGAT TTGCAT AT TATAAACT CTTAAAAAAAGC CAGTGAAGGTTT 

GAAGAGTATAAACCCAGGTGAGACAGCACCCTCTATGCGACTGCTGGCCTATGTTTCTGGCT 
TGGGCTTTGGAATCATGAGTGGAGTATTTTCCTTTGTGAATACCCTATCTGACTCCTTGGGG 
CCAGGCACAGTGGGC^TTCATGGAGATTCTCCTCAATTCTTCCTTTATTCAGCTTTCATGAC 
GC TGGTCATTATCTTG CTGCATGTATTCTGGGG CATTG TATTT TTTG ATGG CTGTGAGAAGA 

AAAAGTGGGGCATCCTCCTTATCGTTCTCCTGACCCACCTGCTGGTGTCAGCCCAGACCTTC 
ATAAGTTCTTATTATGGAATAAACCTGGCGTCAGCATTTATAATCCTGGTGCTCATGGGCAC 
CTGGGCATTCTTAGCTGCGGGAGGCAGCTGCCGAAGCCTGAAACTCTGCCTGCTCTGCCAAG 
AC AAG AACTTTCTT CTTTACAAC CAGCG CTCCAGATAACC T CAGGG AA CCAG CACTTC CCAA 
AC CG CAGACT ACATCTTT AG AGGAAGCACAACTGTG CCTTTTT CTGAAAATC CCTTTTTCTG 
GTGGAATTGAGAAAGAAATAAAACTATGCAGATA 
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FIGURE 128 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA66658 
><subunit 1 of 1, 257 aa, 1 stop 
><MW: 28472, pI: 9.33, NX(S/T): 0 

MTAAVFFGCAFIAFGPALALYVFTIAI2PLRI IFLIAGAFFWLVSLLISSLVWFMARVI IDN 
KDGPTQKYLLIFGAFVSVYIQEMFRFAYTOI^KKA 

GIMSGVFSFVNTLSDSLGPGTVGIHGDSPQFFLYSAFMTLVIILLHVFWGIVFFDGCEKKKW 
GI LL I VLLTHLLVS AQTF I S SYYG INLAS AFI ILVLMGTWAFLAAGGSCRSLKLCLLCQDKN 
FLLYNQRSR 

Important features of the protein: 
Signal peptide: 

amino acids 1-19 

Transmembrane domains: 

amino acids 32-51, 119-138, 152-169, 216-235 

Glycosaminoglycan attachment site. 

amino acids 120-123 

Sodium: neurotransmitter symporter family protein 

amino acids 31-65 
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FIGURE 129 



CGGCAACCAGC CGCCGCCACCACCGCTGCCACTGC CGCC CTGCCGGGGCCATGTTCGCTCTQGGCTTGCCCTTCT 

AGTTTGAGCECACCTACGTGGACGAGGTCAACAGCGAGCTGCT^ 
GCAACAGGACAGAGGGCGTGCGTGTGTCTGTGAACGTCCTGAACAAGCAGAAGGG^ 

TCCGCCAGAAGGAGGCTCTGGTGTCCTTCCAGGTGCCCCTAATCCTGCGAGGGATGTTTCAGCGCAAGTACOT 

ACCAAAAAGTGGAACGAACCCTGTGTCAGCCCCCCACCAAGAATGAGTCGGAG 

TGTCCA.CCCTGTCA.CCAGTCAACACCACATACCAGCTCCGGGTCAGCCGCATGGAC 

GGG AGCAGTTCAGCTT CAAT AC CACAGC AG CACAG C C C C AGTAC TTCAAG TATGAGTrC CCTGAAGG CGTGGACT 

TCTATGACCTGGACAACAACGTAGCCTTGATCGGCATGTACCAGACGATGACOVAGAAGGCGGC 

AGCGCAAAGACTTCCCCAGCAACAGCTTTTATGTGGT 

CCCTGCCTTTCTACCCCTTCGCAGAAGATGAACCGGTC^ 

TGTCTCAAGCAGTCACGTCTGAGGCATACGTCAGTGGGATGCTCTTTTGCCTGGGTATATTTCT 

TGCTGACCGTCCTCCTCGCCTGCTGGGAGAACTGGAGGCAGAAGAAGAAGACCCTGCTGGTGGCCATrGACCGAG 

CCTGCCCAGAAAGCGGTCACCCTCGAGTCCTGGCT 

ATGGCTCCTTTGAGAATGTTTCTGGATCTACCGA^ 

GTTACCAGGGCCGCTCCTTTGAACCTGTAGGTACTCGGCCCC 

ACTACGACACATTGACCGACATCGATTCCGACAAGAATGTCATTCGCACCAAGCAATACCTCTATGTGGCTGACC 

TGGCACGGAAGGACAAGCGTGTTCTGCGGAAAAAGTACCAGATCTACTTCTGGAACATTGCCACCATTGC^ 

TCTATGCCCTTCCTGTGGTGCAGCTGGTGATCACCTACGAGACGGTGGTGAATGT 

GCTACTACAACTTCCTCTGCGCCCACCCACTGGGCAATCTCAGCGCCT^ 

ACATCCTGCTGGGGCTGCTTTTCCTGCTCATCATCCTGCAACGGGAGATCAACCACAACCG^ 

ATGACCTCTGTGCCCTGGAATGTGGGATCCCCAAACACTTTGGGCTTTTCTACGCCATGGGCACAGCCCTG^ 

TGGAGGGGCTGCTCAGTGCTTGCTATCATGTGTGCCCCAACTATACCAATTTCCAGTTTC 

ACATGATCGCCGGACTCTGCATGCTGAAGCTCTACCAGAAGCGGCAC 

CCTACGCCTGCCTGGCCATTGTCATCTTCTTCTCTGTGCTGGGCGTGGTCmG 

GGATCGTCTTCTCCATCATTCACATCATCGCCACCCTGCTCCTCAGCACGCAGCTCTA 

AACTGGACTCGGGGATCTTCCGC CGCATC CTCCACGTGCTCTACACAGACTGCATCCGGCAGTGCAGCGGGCCGC 

TCTACGTGGACCGCATGGTGCTGCTGGTCATGGGCAACGTCATCAACTGGTCGCT 

TGCGCCCCAATGATTTCGCTTCCTACTTGTTGGCCATTTC 

TCATCATGAAGCTCCGGAGTCGGGAGAGGATCAAGCTCATCCCCCTGCTCTGCATC 

GGGGCTTCGCGCTCTTCTTCTTCTTCCAGGGACTCAGCACCTGGCAGAAAACCCCTGCAGAGTCG 

ACCGGGACTGCATCCTCCTCGACTTCTTTGACGACCACGACATCT 

AGGAGCTGGGCCCTTCGCITCACCTCAAGGGGCCCTGAGCTCCTTTGTGTCATA 
GTGGGGATGAGTCCCAGCACCGCTGCCCAGCACTGGATGGCAGCAGGACAGCCAGGTCTAGOT 
GGGACAGCCATGGGGTGGCATGGAACCTTGCAGCTGC CC TCTGCCGAGGAGCAGGCCTGCTCCCCTGGAACCCCC 
AGATGTTGGCCAAATTGCTGCTTTCTTCTCAGTGTTTC 



ACAATGCCCCAGCCTGGGACCTAAGGCCTCTTT 
ATCTCTGTCCTGTATCAGGGCCCCAGTTCTCTTTGGGCTGTCCCTGGCTGCCATCAC^ 

AGGATGGATGGGGGTATGAGATTTTGGGGGTTGGCCAGCTGGTGCCAGACTTTTGGTGCTAAGGCCTGCAAG^ 

CCTGGGGCAGTGCGTATTCTCTTCCCTCTGACCTGTGCTCAGGGCTGGCTCTTTAGCAATGCGCTCAG^ 

TG AGAACCGCC TTCTGATTCAAGAGGCTGAATTCAGAGGTCAC CTCTTCATCCCATCAGCTCCCAGACTGATGCC 

AGCACCAGGACTGGAGGGAGAAGCGCCTCACCCCTTCCCTTCCTTCTTTCCAGGCCC 

AGCTGGTGGCCTTTCAGTGCCATTGACACTGCCCAAGAATGTCCAGGGGCAAAGGAGGGAT^ 

CCCGTTCTGCC TC CACAGCTGTGGGCACC CCAGTG CCTACCTTAGAAAGGGGCTTCAGGAAGGGATGTGCTGTTT 

CCCTCTACGTGGCCAGTCCTAGCCTCGCTCTAGGACCCAGGGCrGGCTTCTAAGTTTCra 

AGTTCTGTGTTAGTCATGCACACACATACCTATGAAACCTTGGAGTTTACAAAGAATTC 

CCTGGCCACCCTGGTCCTTGGATCCCCTTCOTCCCACCTGGTCCACCCCAGATG 

CGGGGCCTCTGCTTTGGGGATGGGAATGTGTTTTTCTCCCAAACT 

AGATGAGGTGGGTTCTGGATCTTTTCTCAGAGCGTCTCCATGCTATGGTTGCATTTCCGTTTTOT 
TGCATTCAATAAACAACCAGACTCAAAAAAAAAAAAAAA 
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FIGURE 130 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA66659 
><subunit 1 of 1, 832 aa, 1 stop 
><MW: 94454, pI: 6.94, NX(S/T): 12 
MFALGLPFLVLLVASVESHLGVLGPKNVSQKDAEFERTYTO 

EGVRVSVNVLNKQKGAPLLFWRQKEAVVS FQVPLILRGMFQRKYLYQKVERTLCQPPTKNE 
SEIQFFYVDVSTLSPVNTTYQLRVSRMDDFVLRTGEQFSFNTTAAQP.QYFKYEFPEGVDSVI 
VKVTSNKAFPCSVISIQDVLCPVYDLDNNVAFIGMYQTMTKKAAITVQRKDFPSNSFYV^ 
VKTEDQACGGSLPFYPFAEDEPVDQGHRQKTLSVLVSQAVTSEAYVSGMLFCLGIFLSFYLL 
TVLLACWENWRQKKKTLLVAIDRACPESGHPRVLADS FPGSS PYEGYNYGSFENVSGSTDGL 
VDSAGTGDLSYGYQGRSFEPVGTRPRVDSMSSVEEDDYDTLTDIDSDK23VIRTKQYLYVADL 
ARKDKRVLRKKYQIYFTOIATIAVFYALPWQLVITYQTVVNVTGNQDICYYNFLCAHPLGN 
LSAFNNILSNLGYILLGLLFLL 1 1 LQRE INHNRALLRNDLCALECG I P KHFGLF YAMGTALM 
MEGLLSACYHVCPNYTNFQFDTSFMYMIAGLCMLKLYQKRHPDINASAYSAYACLAIVIFFS 
VLGWFGKGNTAFWI VFS 1 1 HI I ATL LL S TQL YYMGRWKLDS G I FRR I LH VL YTDC I RQ CS G 
PL YVDRMVLL VMGNV I NWS L AA YGL I MR PN DF AS YLLA IG I CNLLL YF AFY I IMKLRSGER I 

KLIPLLCIVCTSWWGFALFFFFQGLSTWQKTPAESREHNRDCILLDFFDDHDIWHFLSSIA 
MFGS FLVLLTLDDDLDTVQRD KI YVF 

Important features of the protein: 
Signal peptide: 

amino acids 1-18 

Transmembrane domains: 

amino acids 292-317, 451-470, 501-520, 607-627, 751-770 

Leucine zipper pattern. 

amino acids 497-518 

N-glycosylation sites. 

amino acids 27-30, 54-57, 60-63, 123-126, 141-144, 165-168, 364- 
367, 476-479, 496-499, 572-575, 603-606, 699-702 
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FIGURE 131 

GCTCAAGTGCCCTGCCTTGCCCCACCCAGCCCAGCCTGGCCAGAGCCCCCTGGAGAAGGAGC 
TCTCTTCTTGCTTGGCAGCTGGACCAAGGGAGCCAGTCTTGGGCGCTGGAGGGCCTGTCCTG 
ACCATGGTCCCTGCCTGGCTGTGGCTGCTTTGTGTCTCCGTCCCCCAGGCTCTCCCCAAGGC 
CCAGCCTGCAGAGCTGTCTGTGGAAGTTCCAGAAAACTATGGTGGAAATTTCCCTTTATACC 
TGACCAAGTTGCCGCTGCCCCGTGAGGGGGCTGAAGGCCAGATCGTGCTGTCAGGGGACTCA 
GGCAAGGCAACTGAGGGCCCATTTGCTATGGATCCAGATTCTGGCTTCCTGCTGGTGACCAG 
GGCCCTGGACCGAGAGGAGCAGGCAGAGTACCAGCTACAGGTCACCCTGGAGATGCAGGATG 
GACATGTCTTGTGGGGTCCACAGCCTGTGCTTGTGCACGTGAAGGATGAGAATGACCAGGTG 
CCCCATTTCTCTCAAGCCATCTACAGAGCTCGGCTGAGCCGGGGTACCAGGCCTGGCATCCC 
CTTCCTCTTCCTTGAGGCTTCAGACCGGGATGAGCCAGGCACAGCCAACTCGGATCTTCGAT 
TCCACATCCTGAGCCAGGCTCCAGCCCAGCCTTCCCCAGACATGTTCCAGCTGGAGCCTCGG 
CTGGGGGCTCTGGCCCTCAGCCCCAAGGGGAGCACCAGCCTTGACCACGCCCTGGAGAGGAC 
CTACCAGCTGTTGGTACAGGTCAAGGACATGGGTGACCAGGCCTCAGGCCACCAGGCCACTG 
CCACCGTGGAAGTCTCCATCATAGAGAGCACCTGGGTGTCCCTAGAGCCTATCCACCTGGCA 
GAGAAT CT CAAAGT C CTATACCCGCAC CACATGG CC CAGGTACACTGG AG TGGG6GTGATGT 
GC ACTATCAC CTGG AGAGCCATC CC C CGGGACCCTTTG AAGTGAATGC AG AGGGAAAC CT CT 
ACGTGACCAGAGAGCTGGACAGAGAAGCCCAGGCTGAGTACCTGCTCCAGGTGCGGGCTCAG 
AATTCCCATGGCGAGGACTATGCGGCCCCTCTGGAGCTGCACGTGCTGGTGATGGATGAGAA 
TG ACAACGTG CCTAT CTGCCCTCC CCGTGAC C CCAC AGTCAG CATC CCTGAG CTCAGT CCAC 
CAGGTACTGAAGTGACTAGACT GT CAGCAG AG GATG CAGATG CCCC CG GCT C CCCCAATTCC 
CACGTTGTGTATCAGCT C CTGAGC C CTG AG C C TG AGGATGGGGTAG AGGGGAGAG CCTTCCA 
GGTGGACCCCACTTCAGGCAGTGTGACGCTGGGGGTGCTCCCACTCCGAGCAGGCCAGAACA 
TCCTGCTTCTGGTGCTGGCCATGGACCTGGCAGGCGCAGAGGGTGGCTTCAGCAGCACGTGT 
GAAGTCGAAGTCGCAGTCACAG AT ATCAATG ATCAC G C CC CTGAGTT CATCACTT CCCAGAT 
TGGGCCTATAAGCCTCCCTGAGGATGTGGAGCCCGGGACTCTGGTGGCCATGCTAACAGCCA 
TTGATGCTGACCTCGAGCCCGCCTTCCGCCTCATGGATTTTGCCATTGAGAGGGGAGACACA 
GAAGGG ACTTTTGGC CTGGATT GGGAGC CAGACT CTGGG CATGTTAGACTCAGACTCTGCAA 
GAAC CT CAGTTATGAGG CAGCT CC AAGT CATGAGGTGGTGGTGGTGGTG CAG AGTGTGGCGA 
AG CTGGTGGGG CCAGG CC CAGG C C CTGGAGCCACCGC CACGGTGACTGTG CTAGTGGAGAGA 
GTGATG CC AC CCCC CAAGTTGGACCAGG AGAGCTACGAGGCCAGTGTC CC CATCAGTG CC CC 
AGCCGGCTCTTTCCTGCTGACCATCCAGCCCTCCGACCCCAT<^GCCGAACCCTCAGGTTCT 
CCCTAGTCAATGACTCAGAGGGCTGGCTCTGCATTGAGAAATTCTCCGGGGAGGTGCACACC 
GCCCAGTCCCTGCAGGGCGCCCAGCCTGGGGACACCTACACGGTGCTTGTGGAGGCCCAGGA 
TACAGCCCTGACTCITGCCCCrGTGCCCTCCCAATACCTCTGCACACCCCGCCAAGACCATG 
GCTTGATCGTGAGTGGACCCAGCAAGGACCCCGATCTGGCCAGTGGGCACGGTCCCTACAGC 
rrCACCCTTGGTCCCAACCCCACGGTGCAACGGGATTGGCGCCTCCAGACTCTCAATGGTTC 
CCATGCCTACCTCACCTTGGCCCTGCATTGGGTGGAGCCACGTGAACACATAATCCCCGTGG 
TGGTCAGCCACAATGCCCAGATGTGGCAGCTCCTGGTTCGAGTGATCGTGTGTCGCTGCAAC 
GTGGAGGGGCAG TGCATG CGCAAGGTGGGCCGCATGAAGGGCATGCCCACGAAGCTGTCGGC 
AGTGGGCATCCTTGTAGG CACCCTGGTAGC AATAGGAATCTTCCTCAT CCTCATTTTCACCC 
ACTGGACCATGTCAAGGAAGAAGGACCCGGATCAACCAGCAGACAGCGTGCCCCTGAAGGCG 
ACTGTCTGAATGGCCCAGGCAGCTCTAGCTGGGAGCTTGGCCTCTGGCTCCATCTGAGTCCC 
CTGGGAGAGAGC CCAGCAC C CAAG AT CCAG CAGGGGAC AGGACAGAGTAGAAGCC CCTCCAT 
CTGCCCTGGGGTGGAGGCACCATCACCATCACCAGGCATGTCTGCAGAGCCTGGACACCAAC 
TTTATGGACTGCCCATGGGAGTGCTCCAAATGTCAGGGTGTTTGCCCAATAATAAAGCCCCA 
GAGAACTGGG CTGGG CCCTATGGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAG 

/3Z /£ 
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FIGURE 132 

MVPAWLWLLCVSVPQALPKAQPAELSVEVPENYGGNFPLYLTKLPLPREGAEGQIVLSGDSG 
KATEGPFAMDPDSGFIiVTRALDREEQAEYQLQVTLEMQDGHVLWGPQPVLVHVKDENDQVP 
HFSQAI YRARLSRGTRPG I P FLFLEASDRDEPGTANSDLRFHI LSQAPAQPS PDMFQLEPRL 
GALALSPKGSTSLDHALERTYQLLVQVKDMGDQASGHQATATVEVS I IESTWVSLEPIHLAE 
NLKVLYPHHMAQVHWSGGDVHYHLESHPPGPFE 

SHGEDYAAPLELHVLVMDENDNVP I CPPRDPTVS I PELSPPGTEVTRLSAEDADAPGSPNSH 

VVYQLLSPEPEDGVEGRAFQVDPTSGSVTLGVLPLRAGQNILLLVLiATO 

VE VAVTD I NDHAPE FITSQIGPISLP ED VE PGTL VAML TA I DADLE P AFRLMD F AI ERGDTE 

GTFGLDWEPDSGHVRLRLCKNLSYEAAPSHEVWWQSVAKLVGPGPGPGATATVTVLVERV 

MPPPKLDQESYEASVPISAPAGSFLLTIQPSDPISRTLRFSLVNDSEGWLCIEKFSGEVHTA 

QSLQGAQPGDTYTVLVEAQDTALTLAPVPSQYLCTPRQDHGLIVSGPSKDPDLASGHGPYSF 

TLGPNPTVQRDWRLQTLNGSHAYLTLALHWVEPREH 1 1 PVWSHNAQMWQLLVRVI VCRCNV 

EGQCMRKVGRMKGMPTK^SAVGILVGTLVA^ 

Signal peptide: 

amino acids 1-18 

Transmembrane domain: 

amino acids 762-784 
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FIGURE 133 

CCGGGGACATGAGGTGGATACTGTTCATTGGGGCCCTTATTGGGTCCAGCATCTGTGGCC^ 
GAAAAATTTTTTGGGG AC CAAGTTTTGAGGATTAATGT CAGAAATGGAGACGAG AT CAGCAA 

ATTGAGTCAACTAGTGAATTCAAACAACTTGAAGCTCAATTTCTGGAAATCTCCCTCCTCCT 
TCAATCGGCCTGTGGATGTCCTGGTCCCATCTGTCAGTCTGCAGGCATTTAAATCCTTCCTG 
AGAT C C CAGGGCTTAGAGT ACG CAGTGACAATTGAGGAC CTG CAGGCC CTTTTAGACAATGA 

AGATGATGAAATGCAA(^CAATGAAGGGCAAGAACGGAGCAGTAATAACTTCAACTACGGGG 
CTTACCATTCCCTGGAAGCTATTTACCACGAGATGGACAACATTGCCGCAGACTTTCCTGAC 
CTGGCGAGGAGGGTGAAGATTGGACATTCGTTTGAAAACCGGCCGATGTATGTACTGAAGTT 
CAGCACTGGGAAAGGCGTGAGGCGGCCGGCCGTTTGGCTGAATGCAGGCATCCATTCCCGAG 
AGTGGATCTCCCAGGCCACTGCAATCTGGACGGCAAGGAAGATTGTATCTGATTACCAGAGG 
GATCCAGCTATCACCTCCATCTTGGAGAAAATGGATATTTTCTTGTTGCCTGTGGCCAATCC 
TGATGGATATGTGTATACTCAAACTCAAAACCGATTATGGAGGAAGACGCGGTCCCGAAATC 
CTGGAAGCTCCTGCATTGGTGCTGACCCAAATAGAAACTGGAACGCTAGTTTTGCAGGAAAG 
GGAG CC AG CGACAAC C CT TG CT CCGAAGT GTACCATGGAC C CCACG C CAATT CGG AAGTGGA 

GGTGAAATCAGTGGTAGATTTCATCCAAAAACATGGGAATTTCAAGGGCTTCATCGACCTGC 

AC AG CTACT CGCAGCTG CTGATGTATC CAT ATGGGTACTC AGTCAAAAAGGC CC CAGATGCC 

GAGGAACTCGACAAGGTGGCGAGGCTTGCGGCCAAAGCTCTGGCTTCTGTGTCGGGCACTGA 

GTACCAAGTGGGTCCCACCTGCACCACTGTCTATCCAGCTAGCGGGAGCAGCATCGACTGGG 

CGTATGAC^CGGC^TCAAATTTGCATTCACATTTGAGTTGAGAGATACCGGGACCTATGGC 

TTCCTCCTGCCAGCTAACCAGATCATCCCCACTGCAGAGGAGACGTGGCTGGGGCTGAAGAC 

CATC^TGGAGCATGTGCGGGACAACCTCTACTAGGCGATGGCTCTGCTCTGTCTACATTTAT 

TTGTACCCACACGTGCACGCACTGAGGCCATTGT TAAAGGAG CTCTT TCCTACC TG TGTGAG 

TCAGAGCCCTCTGGGTTTGTGGAGCACACAGGCCTGCCCCTCTCCAGCCAGCTCCCTGGAGT 

CGTGTGTCCTGGCGGTGTCCCTGCAAGAACTGGTTCTGCCAGCCTGCTCAATTTTGGTCCTG 

CTGTTTTTGATGAGCCTTTTGTCTGTTTCTCCTTCCACCCTGCTGGCTGGGCGGCTGCACTC 

AGCATCACCCCTTCCTGGGTGGCATGTCTCTCTCTACCTCATTTTTAGAACCAAAGAACATC 

TGAGATGATT CT CT AC C CT CAT CCACAT CTAG CC AAGCCAGTGACCTTGCTC TGGTGGCACT 

GTGGGAGACACCACTTGTCTTTAGGTGGGTCTCAAAGATGATGTAGAATTTCCTTTAATTTC 

TCGCAGTCTTCCTGGAAAATATTTTCCTTTGAGCAGCAAATCTTGTAGGGATATCAGTGAAG 

GTCTCTCCCTCCCTCCTCTCCTGTTTTTTTTTTTTTTGAGAC^GAGTTT^ 

CAGGCTGGAGTGTGATGGCTCGATCTTGGCTCACCACAACCTCTGCCTCCTGGGTTCAAGCA 

ATTCTCCTGCCTCAGCCTCTTGAGTAGCTTGGTTTATAGGCGCATGCCACCATGCCTGGCTA 

ATTTTGTGTTTTTAGTAGAGACAGGGTTTCTCC^TGTTGGTCAGGCTGGTCTCAAACTCCCA 

ACCTCAGGTGATCTGCCCTCCTTGGCCTCCCAGAGTGCTGGGATTACAGGTGTGAGCCACTG 

TGCCGGGCCCGTCCCCTCCTTTTTTAGGCCTGAATACAAAGTAGAAGATCACTTTCCTTCAC 

TGTG CTGAGAATTTCTAGATACTACAGTTCTT ACTC CT CTCTTC CCTTTGTT ATTC AG TGTG 

ACCAGGATGGCGGGAGGGGATCTGTGTCACTGTAGGTACTGTGCCCAGGAAGGCTGGGTGAA 

GTGACCATCTAAATTGCAGGATGGTGAAATTATCCCCATCTGTCCTAATGGGCTTACCTCCT ' 

CTTTGCCTTTTGAACT CACTTCAAAGATCTAGGC CT CATCTTACAGGTCCTAAATCACTCAT 

CTGGCCTGGATAATCTCACTGCCCTGGCACATTCCCATTTGTGCTGTGGTGTATCCTGTGTT 

TCCTTGTCCTGGTTTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTTTGTGTGTGTGTG 

TCTGTCTATTTTGTATCCTGGACCACAAGTTCCTAAGTAGAGCAAGAATTCATCAACCAGCT 

GCCTCTTGTTTCATTTCACCTCAGCACGTACCATCTGTCCTTTTGTTGTTGTTGTTTTGTTT 

TTGTTT TTTTG CTTTTAC CAAACATGTCTGTAAATCTTAAC CTCCTGCCTAGGATTTG TACA 

GCATCTGGTGTGTGCTTATAAGCCAATAAATAITCAATGTGAAAAAAAAAAAAAAAAA 
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FIGURE 134 

MRWI LFIGALIGS S I CGQEKFFGDQVLR INVRNGDE I S KLSQLVNSNNLKLNFWKS PSS FNR 
PVDVLVPSVSLQAFKSFLRSQGLEYAVT IEDLQALLDNEDDEMQHNEGQERS SNNFNYGAYH 
SLEAIYHE^roNIAADFPDIARRVKIGHSFENRPMYVLKFSTGKGVRRPAVWIiNAGIHSREW^ 
SQATAIWTARKIVSDYQRDPAITSILEKMDIFLLPVANPDGYVYTQTQNRLWRKTRSRNPGS 
SCIGADPNRNWNASFAGKGASDNPCSEVYHGPHANSEVEVKSVTO 

S QLLM Y P Y GY S VKKAP DAEE LDKV ARLAAKAL AS V S GTE YQ VG F TCTTVYP AS GS S I DWAYD 
NGI KFAFTFELRDTGTYGFLLPANQ 1 1 PTAEETWLGLKTIMEHVRDNLY 

Signal peptide: 

amino acids 1-16 
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FIGURE 135 

CAAC CATG CAAGGACAGGG CAGGAGAAGAGGAAC CTGCAAAG ACAT ATTTTGTT C C AAA&TG 

GCATCTTACCTTTATGGAGTACTCTTTGCTGTTGGCCTCTGTGCTCCAATCTACTGTGTGTC 

CCCGGCCAATGCCCCCAGTGCATACCCCCGCCCTTCCTCCACAAAGAGCACCCCTGCCTCAC 

AGGTGTATTCCCTCAACACCGACTTTGCCTTCCGCCTATACCGCAGGCTGGTTTTGGAGACC 

CCGAGTCAGAACATCTTCTTCTCCCCTGTGAGTGTCTCCACTTCCCTGGCCATGCTCTCCCT 

TGGGGCCCACTCAGTCACCAAGACCCAGATTCTCCAGGGCCTGGGCTTCAACCTCACACACA 

CACCAGAGTCTGCCATCCACCAGGGCTTCCAGCACCTGGTTCACTCACTGACTGTTCCCAGC 

AAAGACCTGACCTTGAAGATGGGAAGTGCCCTCTTCGTCAAGAAGGAGCTGCAGCTGCAGGC 

AAATTTCTTGGGCAATGTCAAGAGGCTGTATGAAGCAGAAGTCTTTTCTACAGATTTCTCCA 

AC CC CT CCATTG CC CAGG CG AGGATCAACAGC CATGTGAAAAAG AAG AC C C AAGSG AAGGTT 

GTAGACATAATCCAAGGCCTTGACCTTCTGACGGCCATGGTTCTGGTGAATCACATTTTCTT 

T AAAGC CAAG TGGG AG AAG CCCTTTCAC CTTGAATATACAAG AAAG AACT T CC CATT C CT GG 

TGGGCGAGCAGGTCACTGTGCAAGTCCCCATGATGCACCAGAAAGAGCAGTTCGCTTTTGGG 

GTGGATACAGAGCTGAACTGCTTTGTGCTGCAGATGGATTACAAGGGAGATGCCGTGGCCTT 

CTTTGTCCTCC CTAGCAAGGG CAAGATGAGGC AAC TGGAACAGG CCTTGTCAGC CAGAACAC 

TGAT AAAGT GGAGC CACT CACT CC AG AAAAGGTGGATAGAGGTGTT CAT CCCCAGATTTTCC 

ATTTCTGCCTCCTACAATCTGGAAACCATCCTCCCGAAGATGGGCATCCAAAATGCCTTTGA 

CAAAAATG CTGATTTTT CTGGAATTG CAAAGAG AGACT C C CTGCAGGTTTCTAAAG CAACCC 

ACAAGGCTGTGCTGGATGTCAGTGAAGAGGGCACTGAGGCCACAGCAGCTACCACCACCAAG 

TTCATAGTCCGATCGAAGGATGGTCCCTCTTACTTCACTGTCTCCTTCAATAGGACCTTCCT 

GATGATGATT AC AAAT AAAG CC ACAGACGGT ATTCT CTTTCTAGGG AAAGTGGAAAAT CC CA 

C T AAAT C CTAGGT GG GAAAT G G C CTGTT AACT GATGG CACATTG CT AATG CA C AAG AAAT AA 

CAAACCACATCCCTCTTTCTGTTCTGAGGGTGCATTTGACCCCAGTGGAGCTGGATTCGCTG 

GCAGGGATGCCACTTCCAAGGCTCAATCACCAAACGATCAAG 

AAGACCCATTAACCCCAGTGAGTGCCCTTTTCCACAAA 

GGATGTTGCTGGGTTACCATATTTCCATTCCTTGGGGCTCCCAGGAATGGAAATACGCCAAC 
CCAGGTTAGGCAC CT CTATT GC AG AATTACAATAACAC ATT C AATAAAACTAAAATATGAAT 
TCAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA^^ 
AAAAAAA 
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FIGURE 136 

MAS YL YGVL FAVGLCAP I YC VS PANA P S AY PR P S S TKS T P AS QVYSLNTD FAFRL Y RRL VLE 

TPSQNIFFSPVSVSTSLAMLSLGAHSWKTQILQGLGFNLTHTPESAIHQGFQHLVHSLTVP 

SKDLTLKMGSALFVKKELQLQANFl^NVKRLYEAKVFSTDFSNPSIAQARINSHVKKKTQGK 

VVDIIQGLDLLTAMVLVNHIFFKAKWEXPFHLEYTRKNFPFLVGEQVTVQVPMM^ 

GVDTELNCFVLQMDYKGDAVAFFVLPSKGKMRQLEQALSARTLIKWSHSLQKRWIEVFIP^ 

SISASYNLETILPKMGIQNAFDKNADFSGIAKRDSLQVSKATHKAVLDVSEEGTEATAATTT 

KFIVRSKDGPSYFTVSFNRTFLMMITNKATDGILFLGKVENPTKS 

Signal peptide: 

amino acids 1-20 
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FIGURE 137 

GG CT GACCGTGCTACATTG CCTGG AGGAAGCC TAAGGAAC C C AGG C AT C C AGCTGC CCACGC 

CTGAGTCCAAGATTCTTCCCAGGAACACAAACGTAGGAGACCCACGCTCCTGGAAGCACCAG 

CCTTTATCTCTTCACCTTCAAGTCCCCTTTCTCAAGAATCCTCTGTTCTTTGCCCTCTAAAG 

TCTTGGTACATCTAGGAC CCAGGCATCTTGCTTT CCAGC CACAAAGAGAC AGAT GAAGATGC 

AGAAAGGAAATGTT CTCCTTATGTTTGGT CTACTATTGCATTTAGAAG CT GCAACAAATTCC 

AATGAGACTAGCACCTCTGCCAACACTGGATCCAGTGTGATCTCCAGTGGAGCCAGCACAGC 

CACCAACTCTGGGTCCAGTGTGACCTCCAGTGGGGTCAGCACAGCCACCATCTCAGGGTCCA 

GCGTGACCTCCAATGGGGTCAGCATAGTCACCAACTCTGAGTTCCATACAACCTCCAGTGGG 

ATCAGC AC AG CC AC CAACT CTG AGTTCAGCAC AG C GT CC AGTGGGATCAGCATAGC CAC CAA 

CTCTGAGT CCAGCACAAC CTCCAGTGGGGCCAGCACAGCCACCAACTCTGAGTCCAGCACAC 

CCTCCAGTGGGGCCAGCACAGTCACCAA.CTCTGGGTCCAGTGTGACCTCCAGTGGAGCCAGC 

ACTGCCACC^CTCTGAGTCC^GCACAGTGTCC^GTAGGGCC^GCACTGCCACCAACTCTGA 

GTCTAGCACACTCTCCAGTGGGGCCAGCACAGCCACCAACTCTGACTCCAGCACAACCTCCA 

GTGGGGCTAGC^CAGCCACCAACTCTGAGTCC^GC^CAACCTCCAGTGGGGCCAGCACAGCC 

ACCAACTCTGAGTCCAGCACAGTGTCCAGTAGGGCCAGCACTGCCACCAACTCTGAGTCCAG 

CACAACCTCCAGTGGGGCCAGCACAGCCACCAACTCTGAGTCCAGAACGACCTCCAATGGGG 

CTGGCACAGCCACCAACTCTGAGTCCAGCACGACCTCGAGTGGGGCC^^ 

TCTGACTCCAGCACAGTGTCCAGTGGGGCCAG CACTGCCACCAACTCTGAGT CCAGCACGAC 

CTCCAGTGGGGCCAGCACAGCCACCAACTCTGAGTCCAGCACGACCTCCAGTGGGGCTAGCA 

CAGC CACCAACT CTGACT CCAGCACAAC CT CC AGTG GGG C CGG C ACAG CCAC CAACT CTGAG 

TCCAGCACAGTGTCCAGTGGGATCAGCACAGTCACCAATTCTGAGTCCAGCACACCCTCCAG 

TGGGGCCAACACAG CCACCAACTCTGAGT C CAGTACGACCTCCAGTGGGGCC AACACAGCCA 

CCAACTCTGAGTCCAGCACAGTGTCCAGTGGGGCCAGCACTGCCACCAACTCTGAGTCCAGC 

ACAACCTCCAGTGGGGTCAGCACAGCCACCAACTCTGAGTCCAGCACAACCTCCAGTGGGGC 

TAG CACAGCCACCAACT CTGACT C CAGC ACAAC CT CCAGTGAGG CCAGCACAGCCACCAACT 

CTGAGTCTAGCACAGTGT C CAGTGGG AT CAGCAC AGT CACCAATT CTGAGTCCAGCACAACC 

TCCAGTGGGGCCAACAC^GCCACCAACTCTGGGTCC^GTGTGACCrCTGC^GGCTCTGGAAC 

AGCAGCTCTGAC TG GAATG C ACACAACTT CCCATAGTGCAT CTACTG CAGTG AGTG AGGCAA 

AGCCTGGTGGGTCCCTGGTGCCGTGGGAAATCTTCCTCATCACCCTGGTCTCGGTTGTGGCG 

GCCGTGGGGCTCTTTGCTGGGCTCTTCTTCTGTGTGAGAAACAGCCTGTCCCTGAGAAACAC 

CTTTAACACAGCTGTCTACCACCCTCATGGCCTCAACCATGGCCTTGGTCCAGGCCCTGGAG 

GGAATCATGGAGCC C CCCACAGGCCCAGGTGGAGTC CT AACTGGTT CTGGAGGAGACCAGTA 

T CAT CGATAG C C ATGGAG ATGAGCGGGAGGAACAGCGGGC C C2SAGC AGCCC CGGAAGCAAG 

TGCCGC^TTCTTCAGGAATOAAGAGACCTGGGCACCCAAGACCTGGTTTCCTTTCATTCATC 

CCAGGAGAC C CCTCCCAGCTTTGTTTGAGAT C CTGAAAAT CTTG AAGAAGGT ATTCCTCAC C 

TTTCTTGCCTTT ACCAGACACTGGAAAG AGAATACT AT ATTG CTCATT TAGC TAAGAAATAA 

ATAC ATCT CATCT AACACACACGACAAAGAGAAG CTGTGCTTGCCC CG GGGT GGGTAT CTAG 

CTCTGAGATGAACT CAGTT AT AGGAG AAAAC CTC CATG CTGG ACT C CATC TGGC ATTCAAAA 

TCTCCACAGTAAAATCCAAAGACCTCAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 

AAAAAAAAAAAAAAAAAA 
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FIGURE 138 

MKMQKGWVLLMFGLIjIjHLEAATNSNETSTSJ^TGSSVISSGASTATNSGSSVTSSGVSTATI 
SGSSVTSNGVSIVTNSEFHTTSSGISTATNSEFSTASSGISIATNSESSTTSSGASTATNSE 
SSTPSSGASTVTNSGSSVTSSGASTATWSESSTVSSRASTATNSESSTLSSGASTATNSDSS 
TTSSGASTATNSESSTTSSGASTATNSESSTVSSRASTATNSESSTTSSGASTATNSESRTT 
S NGAGTATNS E S STTS SGAS T ATN SDS S TV S S GAS T ATNS ES STTS S GASTATNS E SS TT S S 
GASTATNSDSSTTSSGAGTATNSESSWSSGISTVTNSESSTPSSGANTATNSESSTTSSGA 
NTATNSESSTVS SGAS TATNSES STTS SGVSTATNSESSTTSSGASTATNSDSSTTSS EAST 
ATNSESSTVSSGISTVTNSESSTTSSGANTATNSGSSVTSAGSGTAALTG^TTSHSASTAV 
SEAKPGGSLVPWEIFLITLVSWAAVGLFAGLFFCVRNSLSLRNTFNTAVYHPHGLNHGLGP 
GPGGNHGAPHRPRWSPNWFWRRPVSS I AMEMS GRNSG P 

Signal peptide: 

amino acids 1-20 

Transmembrane domain: 

amino acids 510-532 
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FIGURE 139 

GGGAGAGAGGATAAATAGCAGCGTGGCTTCCCTGGCTCCTCTCTGCATCCTTCCCGACCTTC 
CCAGCAATATGCATCTTGCACGTCTGGTCGGCTCCTGCTCCCTCCTTCTGCTACTGGGGGCC 
CTGTCTGGATGGGCGGCCAGCGATGACCCCATTGAGAAGGTCATTGAAGGGATCAACCGAGG 
GCTGAGCAATGCAG AGAGAGAGGTGGG CAAGG CC CTGGATGG CAT C AACAGTGG AATC ACG C 

ATGCCGGAAGGGAAGTGGAGAAGGTTTTCAACGGACTTAGCAACATGGGGAGCCACACCGGC 
AAGGAGTTGGACAAAGGCGTCCAGGGGCTCAACCACGGCATGGACAAGGTTGCCCATGAGAT 

c^ccatggtattggaou^^^ 

ctgctggacaggccgggaaggaagcagacaaagcggtcct^agggttccacactggggtccac 

CAGG CTGGGAAGGAAGCAGAGAAACTTGGC CAAGGGGTCAAC CATGCTGCTGACCAGGCTGG 

AAAGGAAGTGGAGAAGCTTGGCCAAGGTGCCCACCATGCTGCTGGCCAGGCCGGGAAGGAGC 

TGCAGAATGCT C ATAATGGGGTCAACCAAGC CAGCAAGGAGGCCAAC CAGCTGCTGAATGGC 

AACCATCTU^GCGGATCTTCCAGCCATCAAGGAGGGGCCACAACCACGCCGTTAGCC^ 

GGCCTCAGTCAACACGCCTTTCATCAACCTTCCCGCCCTGTGGAGGAGCGTCGCCAACATCA 

TGCCCT^CTGGCATCCGGCCTTGCTGGGAGAATAATGTCGCCGTTGTCACATCAGCTGAC 

ATGACCTGGAGGGGTTGGGGGTGGGGGACAGGTTTCTGAAATCCCTGAAGGGGGTTGTACTG 
GGATTTGTGAATAAACTTGATACACCA 
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FIGURE 140 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA66675 
><subunit 1 of 1, 247 aa, 1 stop 
><MW: 25335, pI: 7.00, NX(S/T): 0 

MHLARLVGSCSLLLLLGALSGWAASDDPIEKVIEGINRGLSNAEREVGKALDGINSGITHAG 
REVEICVFNGLSNMGSHTGKELDKGVQGLNHGMD^ 

QAGKEADKAVQGFHTGVHQAGKEAEKLGQGVNHAADQAGKEVEKLGQGAHHAAGOAGK^LQN 
AHNGVNQASKEANQIJLiNGNHQSGSSSKQGGATTTPLASGASVNTPFINLPALWRSV 

Important features of the protein: 
Signal peptide: 

amino acids 1-25 

Homologous region to circumsporozoite (CS) repeats: 

amino acids 35-225 
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FIGURE 141 

CTCCGGGTCCCCAGGGGCTGCGCCGGGCCGGCCTGGC^ 

CCCGCGGGGGGCGATGACCGTGCGCTGACCCTGACTCACTCCAGGTCCGGAGGCGGGGGCCCCCGGGGCGACTCG 
GGGGCGGAC CGCGGGG CGGAGCTGCCGCCCGTGAGT CCGGCCGAG CCACCTGAGC CCGAGCCGCGGGACACCGTC 
GCTCCTGCTCTCCGAA^CTGCGCACCGCGATGGGCCTGAGGAGCTXSGCTCGCCGCCCCA^ 

CCCCGGATCAGCCTGCCTCTGGGCTCTGAAGAGCGGCCATTCCTCAGATTCGAAGCT 

ACAGCCCTTCTGCTGAGCAGGGATGGCAGGACCCTGTACGTGGGTC 

AACCTCAGCTTCCTGCCAGGCXSGGGAGTACCAGGAGCTGCTTTGGGGTGCAGACGCy^ 

AGCTTCAAGGGCAAGGAC C CAC?UK:GCGACTG TCAAAACT ACATC AAGAT CCTC CTG C C G CT CAG CGGCAG TCAC 

CTGTTCACCTGTGGCACAGC^CCTTCAGCCCCATGTGTACCTACATCAACATGGA 

GACGAGAAGGGGAATGTCCTCCTGGAAGATGGCAAGGGCCGTTGTCCCT 

CTGGTGGTTGATGGCGAGCTCTACACTGGAACAGTCAGCAGCTTCCAAGGGAAIX^ 

CAAAGCCTTCGCCCCACCAAGACCGAGAGCTCCCTCAACTGGCTGCAAGACCCAGOT 

ATTCCTGAGAGGCTGGGCAGCTTGCAAGGCGATGATGACAAGATCTACTTTTTCTT 

TTTGAGTTCTTTGAGAACACCATTGTGTCCCGCATTGCCCGCATCTGCA^ 

CTACAGCAGCGCTGGACCTCCTTCCTCAAGGCCCAGCTGCTGTGCTCACGGCCCGACGATC 

GTGCTGCAGGATGTCTTCACGCTGAOCCCCAGCCCCCAGGACTOT 

TCCCAGTGGCACAGGGGAACTACAGAAGGCTCT3CCGTCTGTGTCTTCA 

AGCGGCCTCTACAAGGAGGTGAACCGTGAGACACAGCAGTGGTACACCGTGACCCACCCGGTGCCCACACCCCGG 
C C TGGAGCGTGCATCAC CAACAGTGC CCGGGAAAGGAAG AT C AACT CATC CCTGCAGCTCC CAGACCG CGTG CT G 
AACTTCCTCAAGGACCACTTCCTGATGGACGGGCAGOT 

TACCAGCGCGTGGCTGTACACCGCGTCCCTGGCCTGCACCACACCTACGATGTCCT 
GGCCGGCTC CACAAGGCAGTGAGCGTGGGCCCC CGGGTGCACATCATTGAGGAGC^ 
CAGCCCGTGCIAGAATCTGCTCCTGGACACCCACA 
GTGCCCATGGCCAACTGCAGCCTGTACCGGAGCIXSTGGGGACrrc 

AGCGGCTCCAGCTGCAAGCACGTCAGCCTCTACCAGCCTCMCTCGCCACCAGGCCGTGGATCCAGG^ 

GGAGCCAGCGCCAAGGACCTTTGCAGCGCGTCTTCGGITGTGTCCCCGTCTTTTGT^ 

TGTGAGCAAGTCCAGTTCCAGCCCAACACAGTGAACACTTTGGCCTGCCCGCTC 

CTCTGGCTACGCAACGGGGCCCCCGTCAATGCCTCGGCCTCCrGCCACGTGCTACCCACTGGGGA 

GTX3GX3CACCCAAOVGCTGGGGGAGTTCCAGTGCrGGTCACTAGAGGM 

TGC CCAGAGGTGGTGGAGG ACGGGGTGG CAGACC AAACAGATGAGGGTGGCAGTGTACC CGTCATTATCAG CACA 
TCG CGTG TGAGTGC^C CAG CTGGTGGCAAGGCCAGCTC 
ATGTGCACGCTCTTTGTGCTGGCCGTGCTGCTCCCAGTTTTATTCT^ 

CCACTCAACGGCCTAGGGCCCCCTAGCACCCCGCTCGAT^ 

GGGGCCCGAGTCTTCACTGAGTCAGAGAAGAGGCCACTCAGCATCCAAGAC^^ 

TGCCCCCGGCCCCGGGTCCGCCITGGCTCGGAGATCCGTGACTCTGTGGTGT 



ACGACCGTGGTCCCCGGCCCTTGGGAGCCT/TGGAGCCAGCTGGCCTGCTGCTCTC 

TACCACCCAGACACCCAAACAGCCGTGGCCCCAGAGGTCCTGGCCAAATATGGGGGCCTGCCT 

CAGTGCTCCrTTATGTAAACTGAGCCCTTTGTTTAAAAAACAATTCCA 

ATAGCATGGCATGCAGCACACACGGCTGCTCCAGTTCATGGCCTCCCAGGGGTGCTGGGGATG 

TTGTCTGAGACAGAGTTGGAAACCCTCACCAACTGGCCTCTTCACCTTCCACA 

CCTGTCTCACTGCAGATTCAGGACCAGCTTGGGCTGCGTGCGTTCT^ 

TTGCTGCCGTCGTCCCACCACCTCAGGGACCAGAGGGCTAGGTTGGCACTGCGG 

GGACCCAACTCCTGGACCTTTCCAGCCrcTATCAGGCT 

TT TC GT GACAATGT ACGC CTTTC C CT CAGAATTCAGGG AAGAG ACTG TCG C CTGC CTTCCTCCGTTGTTG CGTG A 
GAACCCGTGTGCCCCTTCCCACCATATCCACCCTCGCTCCATCTTTGAACTGA^ 
CTGGTCCTCTCCCCAGTCCCCAGTTCACCCTCCATCCCTCACCTTCCTCCACTCTAAGGGATATC^ 
AGC^CAGGGGCCCTGAATTTATGTGGTTTTTATACATTTTTTAATA 
GTCTGAAGAATTACTGTTTAAAAAAAAAAAA ) 
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FIGURE 142 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA67962 
><subunit 1 of 1, 837 aa, 1 stop 
><MW: 92750, pI: 7.04, NX(S/T): 6 

MLRTAMGLR S WL AA PWGALP PR PP LLLLLLL LLL LQ P P P PTWALS P R I S L PLGS EERPFLRF 
EAEHISNYTALLLSRDGRTLYVGAREALFALSSNLSFLPGGEYQELLWGADAEKKQQCSFKG 
KD PQRD CQNY I K I LLPLS GSHL FTCGTAAF S PMCTY INMENFTLARDE KGNVLLEDGKGRCP 
FDPNFKSTALVVDGELYTGTVSSFQGNDPAISRSQSLRPTKTESS'LNWLQDPAFVASAYIPE 
SLGSLQGDDDKIYFFFSETGQEFEFFENTIVSRIARICKGDEGGERVLQQRWTSFLKAQLLC 
SRPDDGFPFNVLQD VFTLS PS PQDWRDTLFYGVFTSQWHRGTTEGS AVCVFTMKDVQRVFSG 
L Y KE VNRE TQQWYTVTHP VPT PRPG AC I TNS ARERK I N S S LQ L P DRVLNF L KDH FLMDGQ VR 
SRMLLLQPQARYQRVAVHRVPGLHHTYDVLFLGTGDGRLHKAVSVGPRVHI IEELQ I FSSGQ 
PVQNLIJuDTHRGLLYAASHSGWQVPMANCSLYRSCGDCLIJ^DPY^WSGSSCKHVSLYQP 
QLATRPWIQDIEGASAKDLCSASSWSPSFVPTGEKPCEQVQFQPNTVNTLACPI^SNLATR 
LWLRNGAPVNASASCHVLPTGDLLLVGTQQLGEFQCWSLEEGFQQLVASYCPEWEDGVADQ 
TDEGGSVPVI I STSRVSAPAGGKASWGADRS YWKEFLVMCTLFVLAVLLPVLFLLYRHRNSM 
KVFLKQGECASVHPKTCPWLPPETRPLNGLGPPSTPLDHRGYQSLSDSPPGARVFTESEKR 
PLSIQDSFVEVSPVCPRPRVRLGSEIRDSW 

Transmembrane domains: 

amino acids 23-46 (type II), 718-738 
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FIGURE 143A 

CTAAGCCGGAGGATGTGCAGCTGCGGCGGCGGCGCCGGCTACGAAGAGGACGGGGAC^VGGCGCCCTGCGAACCGA 
GCCCAGCCAGCCGGAGGACGCGGGCAGGGCGGGACGGGAGCCCX3GACTCGTCTGCCGCCGCCGTCGTCGCCGTCG 

CG ^CATGGTCCCCTCTTAAAGGCGCAGGCCGCGGCGGCGGGGGCGGGTGTGC^ 

CGGCGCTAGGGCGGGCTGGCCTCCGTGGGCGGGGGCAGCGGGCT 
GGCGGCGGCGGCGGCCCC^GGGCGGAGCGGCGCGGGCA^GGC^ 
TGCTCGGGCTCGTCCTGGGCTTCGTGGTGGCCTCGCGGSCTCGTCCTGCC 



TCGTGGGAGTCATGACCG CCCAGAAATACCTGC AG AC TCGGGCCGTGGC CGCCTACAGAACATGGTCCAA6ACAA 
TTCC7IX3GGAAAGTTCAGTTCrTCTCAAGTGAGGGTTCTGACACATCTGTACCAA 

GTGTGGACGACTCCTACCCGCCCCAGAAGAAGTCCTTCATGATGCTCAAGTACATGCACGACCACTACTT 

AGTATGAATGGTTTATGAGAGCAGATGATGACG7GTACATCAAAGGAGACCGTCTGGAGAACTTCCTGAGG 

TGAACAGCAGCGAGCCCCTCTTTCTTGGGCAGACAGG^ 

AGCCTGGTGAGAACTTCTGC^TGGGGGGGCCTGGCGTGATCATGAGCCGGGAGGTGOT 

ACATTGGCAAGTGTCTCCGGGAGATGTACACCACCCATGAGGACGTGGAGGTC 

CAGGGGTGCAGTGTGTCTGGTCTTATGAGATGCGGCAGCTTT1TTATGAGAATTACGAGCAG 

ACATTAGAGATCTCCATAACAGTAAAATTCACCAAGCTATC^ 

ACAGGCTCCACAGCTAC^TGCTGAGCCGCAAGATATCCGAGCTCCG^ 

TTGTCCTGATGAGCAAATACAGCAACACAGAAATTCATAAAGAGGACCTCCAGCTGGGAATCCC 

TGAGGTTTCAGCCCCGCCAGCGAGAGGAGATTCTGGAATGGGAGTTTCTGACTGGAAA^ 

TTGACGGCCAGCCCCCTCGAAGAGGAATGGACTCCGCCCAGAGGGAA 

TG GAGATGATCAATG C CAACGC CAAG AC CAGAGGG CGCATC ATTGACTTCAAAGAGATC CAGTACGGCT ACCG CC 

GGGTGAACCCCATGTATGGGGCTGAGTACATCCTGGACCTGCTGCT^^ 

TGACGCTCCOTGTGAGWAGGCACGCGTATTTACAGCAGACT 

TG GATG C ACAAGAGTTGGCCAAGAGAATCAAT CAG GAATCTGG ATC CTTGTCCTTTCTCTCAAACTCCCTGAAGA 
AGCTCGTCCCCTTTCAGCTCCCTGGGTCX^GAGTGAGCACAAAGAACCCAAAGATAAAAA^ 
rrCCTTTGTCTGC^CGTTTCGACATGTTTGTGAGATTTATGGGAAACTTTGAGAAGAC 
AGAACGTCAAGCTCGTGGTTCTGCTTTTCAATTCTGACTCC^ 

GAGATTACCGCATTAAGTACCCTAAAGCCGACATGCAGATTTTGCCTGTGTCTCGAGACT 



CAGAATTCCTTCAGCGATGTCGAGCAAATACAGTTCTGGGCCAA^ 

ATGAC CCAAAGATTGTTTATAGTGGGAAAGT TC CCAG TGACAACCATTTTGC CTTT ACTCAGAAAACTGG CTTCT 

GGAGAAACTATGGGTTTGGCATCACGTGTATTTATAAGGGAGATCTTGTCCGAGTGGGT GG CTTTGATGTTTCCA 

TCCAAGGCTG GGGG CTGGAGGATGTGG AC CTTTT CAACAAGGTTGT CCAGGCAGGTTTG AAGACGTTTAGGAG CC 

AGGAAGTAGGAGTAGTCCACGTCCACCATCCTGTCTTTTGTGATCCCAATCTTGACCCCAAACACT^ 

GCTTGGGGTCCAAAGCATCGACCTATGGGTCCACCCAGCAGCTGGCTGAGATGTGGCTGGA 

GTTACAGTAAAAGCAGCAATAATAATGGCTCAGTGAGGACAGCCTAATGTCCAGCTTTGCTG 

TAATTATCTAATTTATTTTT CAAAAATTTTTTGTATGATCAG TT TT TG AAGT CCGTATACAAGGATATATTTTAC 

AAGTGGTTTTCTTACATAGGACTCCTTTAAGATTGAGCT 

CACATCTTCTTGCTGAACATTATGTAGCAGACCTGCTTAACTTTGAC^ 

TTTAAAAAAATGTTITCTTTTGAGACCCTTTX3CTCCAGTCCTATC 

T ^^^^^^^^^^^^^^^^^ T, -^^^ T C TGOT AAAT GT T OT G T TG X G A T'TGTT AT X C CAOAJG1A.TX CTT AC C TT TT C5 X 
GTTTTGTTTTTTTTTTTT ACAATT GTTTTAAA 

GCTGTTTCATCATTGTCTTCAGGAGAGCTTTCCAGAGTTGATCATTTCCTCTCATGGTACT 

CACGTAGGTTTTTTGTTTGTTTTGTTTTGTTCTTTTT^^ 

CAGTGGCGC^VATCTTGGCTGACTTTAACCTCCACTTCCCT 

AGCTGGGATTACAGG C AC ACAC CAC CA.CGC CC!AGNT AGTTTTT TTGTATTTTTAGTAGAGACGGG^ CAT 
G CAAG CC CAG CTGGCCACGTAGGlXri'AAAGCAAGGGGCGTGAAGAAGGCACAGTGAGGTATGTGG 
TGGTAGTTCATTCGGCCTAAATAGACCTGGCATTAAATTTCAAGA^ 
CTCITTAAAGGGTAAAATATTAATGTTTAGAATGACAAAGATGAAT^ 
GAAACATACACACATACACCCTAATCAAAACGTTGGG<3AAAAATGTATTTGGTTTTC 

TGTTAT^^GGGTGGAGATGGTTTTCATTCTTTCA CTGTTTTGTTTTATC CTT TGTATCTGAAATACCTTTAA 

TTTATTTAATATCTG XTGTT CAGAGCTCTGCCATTTCTTGJ^TACCT 

GAGTGTGTTTAGTCTGTTTTATTTGCAGTAAACCGATCTCCAAAGA 



70 
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FIGURE 143B 



TTAATTTTTATATTCCITACTGTTTTACTAAM 

G ACAAAAGTGAAATGAATCTGT CATTATACCAGAAAGTTAAATTCT CAQ ATCAAATGT QCCTTAATAAATTTGTT 
TTCATTTAGATTTCAAACAGTGATAGAC TTG C CATTTTAATACACGT C ATTGGAGGGC TGCGTATTTG TAAATAG 
CCTGATGCTCATTTGGAAAAATAAACCAGTGAACAATATTTTTCTATTGTA 
ATTCCTGTTTTAGCTGAAGAATTGTATTACATTTGGAGAGTAAAAAACTTAAACACGAAAAAA 
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FIGURE 144 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68836 
><subunit 1 of 1, 802 aa, 1 stop 
><MW: 91812, pI: 9.52, NX(S/T): 3 
MAARGRI^WLSVLLGLVLGFVI^ 

GDARGAQLWP PGSDPDGGPRDRNFLFVGVMTAQKYLQTRAVAAYRTWSKTI PGKVQFFSSEG 
SDTSVPIPWPLRGVDDSYPPQKKSFWLKYMHDHYLDKYEWFMRADDDVYIKGDRLENFLR 
SI^SSEPLFLGQTGLGTTEEMGKLALEPGENFCMGGPGVIMSREVLRRMVPHIGKCLREMW 
THEDVEVGRCVRJ^FAGVQCWSYEMRQLFYENYEQNK^ 

YQYRLHSYMLSRKISELRHRTIQLHREIVLMSKYSNTEIHKEDLQLGIPPSFMRFQPRQREE 
ILEWEFLTGK YL YS AVDGQ PPRRGMDSAQREALDD I VMQVMEM I NANAKTRGRI I DF KE IQ Y 

GYRRVNPMYGAEYI LDLLLLYKKHKGKKMTVP VRRHAYLQQTFSKI QFVEHEELDAQEI*^ 

INQESGSLSFLSNSLKKLVPFQLPGSKSEHKEPKDKKINILIPLSGRFDMFVRFMGNFEKTC 
LIPNQNWLWLLFNSDSNPDKAKQVELMROT 

FNNESLLFFCDVDLVFTTEFLQRCRANTVLGQQIYFPIIFSQYTDPKIVYSGKVPSDNHFAFT 
QKTGFWRNYG FG I TC I YKGDLVRVGGFDVS I QGWGLEDVDLFNK WQAGLKTFRSQEVGWH 
VHHPVFCDPNIJDPKQYKMCLGSKASTYGSTQQIiAEMWI^KITO 

Signal peptide: 

amino acids 1-23 
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FIGURE 145 

GGACAACCGTTGCTGGGTGTCCCAGGGCCTGAGGCAGGACGGTACTCCGCTGACACCTTCCC 
TTTCGGCCTTGAGGTTCCCAGCCTGGTGGCCCCAGGACGTTCCGGTCGCATGGCAGAGTGCT 
ACGGACGACGCCTATGAAGCCCTTAGTCCTTCTAGTTGCGCTTTTGCTATGGCCTTCGTCTG 
TGCCGGCTTATCCGAGCATAACTGTGACACCTGATGAAGAGCAAAACTTGAATCATTATATA 
CAAGTTTTAGAGAACCTAGT ACGAAGTGTT C C CTCTGGGG AG CCAGGT CGTGAG AAAAAATC 

taactctccaaaacatgtttattctatagcato^ 

CACATGGAGACG CTTC AACTGAG AATGATGTTTTAAC C AAT C CTATCAGTGAAGAAACTACA 
ACT TT C CCTACAGGAGGCT TCACACCGG AAATAGGAAAGAAAAAACACACGGAAAGTAC C CC 
ATTCTGGTCGATCAAACCAAACAATGTTTCCATTGTTTTGCATGCAGAGGAACCTTATATTG 
AAAATGAAGAGCCAGAGCCAGAGCCGGAGCCAGCTGCAAAACAAACTGAGGCACCAAGAATG 
TTGCCAGTTGTTACTGAATCATCTACAAGTCCATATGTTACCTCATACAAGTCACCTGTCAC 
CACTTTAGATAAGAGCACTGGCATTGAGATCTCTACAGAATCAGAAGATGTTCCTCAGCTCT 
CAGGTG AAACTGCG ATAGAAAAACC CGAAGAGTTTGGAAAGCAC CCAG AGAGTTGGAATAAT 
GATGACATTTTGAAAAAAATTTTAGATATTAATT CACAAGTGCAACAGGC AC TT CTTAGTGA 
CACCAGCAACCCAGCATATAGAGAAGATATTGAAGCCTCTAAAGATCACCTAAAACGAAGCC 
TTGCTCTAGCAG CAG CAG CAGAACAT AAATTAAAAACAATGT ATAAGTC C CAGTTAT TGCCA 
GTAGGACGAACAAGTAATAAAATTGATGACATCGAAACTGTTATTAACATGCTGTGTAATTC 
TAGATCTAAACTCTATGAATATTTAGATATTAAATGTGTTCCACCAGAGATGAGAGAAAAAG 
CTGCTACAGTATTCAATACATTAAAAAATATGTGTAGATCAAGGAGAGTCACAGCCTTATTA 
AAAGTTTATTAMCAATAATATAAAAATTTTAAACCTACTTGATATTCCATAACAAAGCTGA 
TTTAAGCAAACTGCATTTTTTGACAGGAGAAATAATCATATTCGTAATTTCAAAAGTTGTAT 
AAAAATATTTTCTATTGTAGTTC^^TGTGCC^CATCTTTATGTGTCATGTGTTATGAAC^ 
ATTTTCATATGC^CTAAAAACCTAATTTAAAATAAAATTTTG GTT CAGGAAAAAA 
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FIGURE 146 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68864 
><subunit 1 of 1, 350 aa, 1 stop 
><MW: 39003, pI: 5.59, NX(S/T): 1 
MKPLVIiVALIiLWPSSVPAYPSITVTPD^ 

HVYSIASKGSKFKELVTHGDASTENDVLTNPISEETTTFPTGGFTPEIGKKKHTESTPFWSI 

KPNNVS I VLHAEEP YI ENEEPEPEPE PAAKQTE APRMLP WTES STS PYVTSYKS PVTTLDK 

STG I E I STESEDVPQLSGETAI EKPEEFGKHPESWNNDDI LKKILDINSQVQQALLSDTSNP 

AYREDIEASK2}HLKRSLAIJWU\EHKLKT^ 

YE YLD I KCVP PEMREKAATVFNTLKNMCRSRRVTALLKVY 

Signal peptide: 
amino acids 1-19 
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FIGURE 147 

CGGCTCGAGCGGCTCGAGTGAAGAGCCTCTCCACGGCTCCTGCGCCTGAGACAGCTGGCCTG 

ACCTCCAAATCATCCATCCACCCCTGCTGTCATCTGTTTTCATAGTGTGAGATCAACCCACA 

GGAATATCC^^CTTTTGTGCTCATTTTGGTTCTCAGTTTCTACGAGCTGGTGTCAGGACA 

GTGGCAAGTCACTGGACCGGGCAAGTTTGTCCAGGCCTTGGTGGGGGAGGACGCCGTGTTCT 

CCTGCTCCCTCTTTCCTGAGACCAGTGCAGAGGCTATGGAAGTGCGGTTCTTCAGGAATCAG 

TTCCATGCTGTGGTCCACCTCTACAGAGATGGGGAAGACTGGGAATCTAAGCAGATGCCACA 

GTATCGAGGGAGAACTGAGTTTGTGAAGGACTCCATTGCAGGGGGGCGTGTCTCTCTAAGGC 

TAAAAAACATCACTCCCTCGGACATCGGCCTGTATGGGTGCTGGTTCAGTTCCCAGATTTAC 

GATGAGGAGGCCACCTGGGAGCTGCGGGTGGCAGCACTGGGCTCACTTCCTCTCATTTCCAT 

CGTGGGATATGTTGACGGAGGTATCCAGTTACTCTGCCTGTCCTCAGGCTGGTTCCCCCAGC 

CC ACAG C CAAGTG GAAAGGT CCACAAGG ACAGGATTTGTCTTCAGACTCCAGAGCAAATGCA 

GATGGGTACAGC CTG TATGATG TGGAGATCT C CATTATAGTCCAGGAAAATG CTGGGAGCAT 

ATTGTGTTC CAT CCAC CTTG CTGAGCAGAGTCATGAGGTGGAATCCAAGGTATTGATAGGAG 

AGACGTTTTTCCAGCCCTCACCTTGGCGCCTGGCTTCTATTTTACTCGGGTTACTCTGTGGT 

GCCCTGTGTGGTGTTGTCATGGGGATGATAATTGTTTTCTTCAAATCCAAAGGGAAAATCCA 

GG CGGAACTGGA C TGG AGAAGAAAGCACGGACAGGCAGAATTGAGAGA CG CCCGGAAACACG 

CAGTGGAGGTGACTCTGGATCCAGAGACGGCTCACCCGAAGCTCTGCGTTTCTGATCTGAAA 

ACTGTAACCCAT AGAAAAG CT CCCCAGGAG GTGCCT CACTCTGAGAAGAGATTTAC AAGGAA 

GAGTGTGGTGGCTTCTCAGGGTTTCCAAGCAGGGAGACAT TACTGGGAG GTGGACGTGGGAC 

AAAATGTAGGGTGGTATGTGGG AGTGTGTC GG GATG ACGT AGACAGGGGG AAGAACAATGTG 

ACTTTGTCTCCCAACAATGGGTATTGGGTCCTCAGACTGACAACAGAACATTTGTATTTCAC 

ATTCAATCCCCATTTTATCAGCCTCCCCCCCAGCACCCCTCCTACACGAGTAGGGGTCTTCC 

TGGACTATGAGGGTGGGA CCAT CTC CTT CTTCAATACAAATGAC CAGTC CCTTATTTATACC 

CTGCTGACATGT CAGT TT GAAGG CTTGTTGAGAC C CTATATC CAGCATGCGATGTATGACGA 

GGAAAAGGGGACTC CCATATTCATATGT C CAGTGTC CTGGGG ATgAGACAGAGAAGACCCTG 

CTTAAAGGGCCCCACACCACAGACCCAGACACAGCCAAGGGAGAGTGCTCCCGACAGGTGGC 

CCCAGCTTCCTCTCCGGAGCCTGCGCACAGAGAGTCACGCCCCCCACTCTCCTTTAGGGAGC 

TG AGGTTCTT CTGC CCTG AG C CCTGCAGCAGCGG CAGT CACAGCTT CCAGATGAGGGGGG AT 

TGG C CTGA CC CT GT GGGAG T CAG AAG C CAT GG CT G C CCTGAAGTGGG GACGGAATAGACT CA 

CATTAGGTTTAGTTTGTGAAAACTCCATCCAGCrAAGCGATCTTGAACAAGTCACAACCTCC 

CAGGCTCCTCATTTGCTAGTCACGGACAGTGATTCCTGCCTCACAGGTGAAGATTAAAGAGA 

CAACGAATGTGAAT CATG CTTGCAGGTTTGAGGGCACAGTGTTTGCTAATGATGTGTTTTTA 

T AT T ATACAT TT T C C C AC CATAAACT C T GTT TG CTT ATT C CA CATT AATT TACTTT T CT CT A 

TACCAAAT C ACCCATGGAATAGTTATTGAACACCTG CTTTGTGAGG CT CAAAGAAT AAAGAG 

GAGGTAGGATTTTTCACTGATTCTATAAGCCCAGCATTACCTGATACCAAAACCAGGC^^ 

AAAACAGAAGAAGAGGAAGGAAAACTACAGGT CCATATCC CTCATTAACACAGACACAAAAA 

TTCTAAATAAAATTTTAACAAATTAAACTAAACAATATATTTAAAGATGATATATAACTACT 

CAGTGTGGTTTGTCCCACAAATGCAGAGTTGG1TTAATATTTAAATATCAACCAGTGTAATT 

CAG CACATTAATAAAGTAAAAAAGAAAACCATAAAAAAAAAAAAAAA 
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FIGURE 148 



></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68866 
><subunit 1 of 1, 466 aa, 1 stop 
><MW: 52279, pI: 6.16, NX(S/T): 2 

MAFVLILVLSFYELVSGQWQVTGPGKFVQALVGEDAVFSCSLFPETSAEAMEVRFFRNQFHA 
VVHLYRIX3EDWESKQMPQYRGRTEFVKDSIAGGRVSLRLKNITPSDIGLYGCWFSSQIYDEE 
ATWELRVAALGSLPLISIVGYVDGGIQLLCLSSGWFPQPTAKWKGPQGQDLSSDSRANADGY 
SLYDVE IS 1 1 VQENAGS I LCS IHLAEQSHEVESKVL IGETFFQPS PWRLAS I LLGLLCGALC 
GVVMGMIIVFFKSKGKIQAELDWRRIOTGQAELRDARKHAVEVTLDPETAHPKLCTSDLKTVT 
HRKAPQEVPHSEKRFTRKSWASQGFQAGRHYWEVDVGQNVG 

PNNG YWVLRLTTEHL YFT FNPHF ISLPPSTP PTRVG VF LD YE GGT I S F FNTNDQ §L I YTLLT 
CQFEGLLRPYIQHAMYDEEKGTPIFICPVSWG 

Signal peptide: 

amino acids 1-17 

Transmembrane domains: 

amino acids 131-150, 235-259 
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FIGURE 149 

C CTT CACAGGACTCTT CATTG CTGGTT GGCAATgATGTAT CGGCCAGATGTGGTGAGGGCTA 
GGAAAAGAGTTTGTTGGGAACCCTGGGTTATCGGCCTCGTCATCTTCATATCCCTGATTGTC 
CTGGCAGTGTGCATTGGACTCACTGTTCATTATGTGAGATATAATCAAAAGAAGACCTACAA 
TTACT ATAGCACATTGT CATTTACAACTGA CAAACTATATGCTGAGTT TGGCAGAGAGGCTT 
CTAACAATTT TACAGAAATG AG CGAGAGACTTGAAT CAATGGTG AAAAATGCATTTTATAAA 
TCTCCATTAAGGGAAGAATTTGTCAAGTCTGAGGTTATCAAGTTCAGTCAACAGAAGCATGG 
AGTGTTGGCTCATATGCTGTTGATTTGTAGATTTCACTCTACTGAGGATCCTGAAACTGTAG 
ATAAAATTGTTCAACTTGTTTTACATGAAAAGCTGCAAGATGCTGTAGGACCCCCTAAAGTA 
GATCCTCACT CAGTTAAAATTAAAAAAATC AACAAG ACAG AAACAGACAGCTATCTAAAC CA 
TTGCTG CGGAACACG AAGAAGT AAAAGT CTAGGT C AG AGTCT CAGGAT CGTTGGTGGGACAG 
AAGT AGAAGAGGGT GAATGGCC CTGGCAGG CT AG CCTGCAGTGGGATGGGAGT CATCGCTGT 
GGAGCAACCTTAATTAATGCCACATGGCTTGTGAGTGCTGCTCACTGTTTTACAACATATAA 
GAAC CCTG CCAGAT GGACTGCTT C CTTTGGAGTAACAATAAAACCTT CGAAAATGAAACGGG 
GTCTCCGGAGAATAATTGTCCATGAAAAATACAAACACCCATCACATGACTATGATATTTCT 
CTTGCAGAGCTTTCTAGCCCTGTTCCCTACACAAATGCAGTACArAGAGTTTGTdTCCCTGA 
TGCATCCTATGAGTTTCAACCAGGTGATGTGATGTTTGTGACAGGATTTGGAGCACTGAAAA 
ATGATGGTTACAGTCAAAATCATCTTCGACAAGCACAGGTGACTCTCATAGACGCTACAACT 
TGCAATGAACCTCAAGCTTACAATGACGCCATAACTCCTAGAATGTTATGTGCTGGCTCCTT 
AGAAGGAAAAACAGATGCATGCCAGGGTGACTCTGGAGGACCACTGGTTAGTTCAGATGCTA 
GAGATATCTGGTACCTTGCTGGAATAGTGAGCTGGGGAGATGAATGTGCGAAACCCAACAAG 
CCTGGTGTTTATACTAGAGTTACGGC CTTG CGGG ACTGGATT ACTT CAAAAA CTGGTAT CTA 
AGAGACAAAAGCCTCATGGAACAGATAACATTTTTTTTTGTTTTTTGGGTGTGGAGGCCATT 
TTTAGAGATACAGAATTGGAGAAGACTTG CAAAACAGCTAGATTTGACTGAT CT CAATAAAC 
TGTTTGCTTGATGCATGTATTTTCTT CC CAGCTCTGTT CCGCACGTAAGCAT CCTG CTTCTG 
CCAGATC^CTCTGTCATCTGTGAGCAATAGTTGAAACTTTATGTACATAGAGAAATAGATA 
ATACAATATTACATTACAGC CTGT ATTCATTTGTTCT CTAGAAGTTTTGTCAGAATTTTGAC 
TTGTTGACATAAATTTGTAATGCATATATACAATTTGAAGCACTCCTTTTCTTCAGTTCCTC 
AGCTCCTCTCATTTCAGCAAATATCCATTTTCAAGGTGCAGAACAAGGAGTGAAAGAAAATA 
TAAGAAGAAAAAAATCCCCTACATTTTATTGGCACAGAAAAGTATTAGGTGTTTT^CTTAGT 
GG AATATT AG AAATG AT C AT ATTCATTAT GAAAGGT CAAGCAAAGACAGCAGAATACCAATC 
AC TT CAT C ATTT AGGAAGTATGGGAACTAAGTTAAGGAAGTCCAGAAAGAAGCCAAGATATA 
TC CTTATTTT CAT TTC CAAACAACTACT ATGATAAATGTGAAGAAGATT CTGTTTTTTTGTG 
ACCTATAATAATTATACAAACTTCATGCAATGTACTTGTTCTAAGCAAATTAAAGCAAATAT 
TTATTTAACATTGT T ACTGAGGATGTCAAC ATATAACAATAAAATATAAATCAC CCA 
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FIGURE 150 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68871 
><subunit 1 of 1, 423 aa, 1 stop 
><MW: 47696, pI: 8.96, NX(S/T): 3 

MMYRPD WRARKRVCWE PWV IGLV I F I S L I VL AVC I GLTVHYVRYNQKKTYKYYSTLS FTTD 

KLYAEFGREASNNFTEMSQRLESMVKNAFYKSPLREEFVKSQVIKFSQQKHGVIAH^ 

FHSTEDPETVDKI VQLVLHEKLQDAVGPPKVD PHSVKI KKINKTETDSYLNHCCGTRRSKTL 

GQSLRIVGGTEVEEGEWPWQASLQWDGSHRCGATLINATWLVSAAHCFTTYKNPARWTASFG 
VTIKPSKMKRGLRRI IVHEKYKHPSHDYD^^ 

MFVTGFGALKNDGYSQNHLRQAQVTLIDATTCNEPQAYNDAITPRMLCAGSLEGKTDACQGD 
SGGPLVSSDARDIWYLAGIVSWGDECAKPNKPGVYTRVTALRDWITSKTGI 

Transmembrane domain: 

amino acids 21-40 (type II) 
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FIGURE 151 

GTCGAAGGTTATAAAAGCTTCCAGCCAAACGGCATTGAAGTTGAAGATACAACCTGACAGCA 
CAGCCTGAGATCTTGGGGATCCCTCAGCCTAACACCC1ACAGACGTCAGCTGGTGGATTCCCG 
CTGCATC^GGCCTACCCACTGTCTCC^EGCTGGGCTCTCCCTGCCTTCTGTGGCTCCTGGC 
CGTGACci j.u ri'GGTTCCCAGAGCT CAG CC CTTGGC C C CTCAAGACTTTGAAGAAG AGGAGG 
CAGATGAGACTGAGACGGCGTGGCCGCCTTTGCCGGCTGTCCCCTGCGACTACGACCACTGC 
CGACACCTGCAGGTGCCCTGCAAGGAGCTACAGAGGGTCGGGCCGGCGGCCTGCCTGTGCCC 
AGGACTCTCCAGCCCCGCCCAGCCGCCCGACCCGCCGCGCATGGGAGAAGTGCGCATTGCGG 
CCGAAGAGGGCCGCGCAGTGGTCCACTGGTGTGCCCCCTTCTCCCCGGTCCTCCACTACTGG 
CTGCTGCTTTGGGACGGCAGCGAGGCTGCGCAGAAGGGGCCCCCGCTGAACGCTACGGTCCG 
CAGAGCCGAACTGAAGGGGCTGAAGCCAGGGGGCATTTATGTCGTTTGCGTAGTGGCCGCTA 
ACGAGGCCGGGGCAAGCCGCGTGCCCCAGGCTGGAGGAGAGGGCCTCGAGGGGGCCGACATC 
CCTGCCTTCGGGCCTTGCAGCCGCCTTGCGGTGCCGCCCAACCCCCGCACTCTGGTCCACGC 
GG CCGT CGGGGTGGG CACGG CCCTGGCCCTGCTAAGCTGTGCCG C C CTGG TGTGG C A CTTCT 

GCCTGCGCGATCGCTGGGGCTGCCCGCGCCGAGCCGCCGCCCGAGCCGCAGGGGCGCTCTGA 
AAGGGGCCTGGGGGCATCTCGGGCACAGACAGCCCCACCTGGGGCGCTCAGCCTGGCCCCCG 
GGAAAGAGGAAAACCCGCTGCCTCCAGGGAGGGCTGGACGGCGAGCTGGGAGCCAGCCCCAG 
GCTCCAGGGCCACGGCGGAGTCATGGTTCTCAGGACTGAGCGCTTGTTTAGGTCCGGTACTT 
GGCGCTTTGTTTCCTGGCTGAGGTCTGGGAAGGAATAGAAAGGGGCCCCCAATTTTTTTTTA 
AGCGGCCAGATAATAAATAATGTAAC CTTTGCGGTTAAAAAAAAAAAAAAAAAA 
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FIGURE 152 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68874 
><subunit 1 of 1, 238 aa, 1 stop 
><MW: 25262, pI: 6.44, NX(S/T): 1 
M^SPCLLWLLAVTFLVPRAQPIAPQDFEEEEADETETAW 

LQRVGPAACLCPGLSSPAQPPDPPRMGEVRIAAEEGRAWHWCAPFSPVLHYWLLLWDGSEA 
AQKGPPLNATVRRAELKGLKPGGI YVVCVVAANEAGASRVPQAGGEGLEGAD I PAFGPCSRL 
AVPPNPRTLVHAAVGVGTALALLSCAALVWHFCLRDRWGCPRRAAARAAGAL 

Important features of the protein: 
Signal peptide: 

amino acids 1-20 

Transmembrane domain: 

amino acids 194-220 

N-glycosylation site. 

amino acids 132-135 
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FIGURE 153 

AGAGAAAGAAGCGTCTCCAGCTGAAGCCAATGCAGCCCTCCGGCTCTCCGCGAAGAAGTTCC 

CTGCCCCGATGAGCCCCCGCCGTGCGTCCCCGACTATCCCCAGGCGGGCGTGGGGCACCGGG 

CCCAGCGCCGACGATCGCTGCCGTTTTGCCCTTGGGAGTAGGATGTGGTGAAAGGATGGGGC 

TTCTCCCTTACGGGGCTCACAATGGCCAGAGAAGATTCCGTGAAGTGTCTGCGCTGCCTGCT 

CTACGCCCTCAATCTGCTCTTTTGGTTAATGTCCATCAGTGTGTTGGCAGTTTCTGCTTGGA 

TGAGGGACTAC CTAAATAATGTTCTCACTTTAACTG CAGAAACG AGGGTAGAGGAAGCAGTC 

ATTTTGACTTACTTT CCTGTGGTT CATC CGGTCATGATTGCTGTTTGCTGTTTCCTTATCAT 

TGTGGGGATGTTAGGATATTGTGGAACGGTGAAAAGAAATCTGTTGCTTCTTGCATGGTACT 

TTGGAAGTTTGCTTGTCATTTTCTGTGTAGAACTGGCTTGTGGCGTTTGGACATATGAACAG 

GAACTTATGGTTCCAGTACAATGGTCAGATATGGTCACTTTGAAAGCCAGGATGACAAATTA 

TGGATTAC CTAGATATCGGTGGCTTACT CATGCTTGGAATTTTTTTCAGAGAGAGTTTAAGT 

GCTGTGGAGT AGTATATTTCACTGAC TGGTTGGAAATGACAG AG ATGGACTGGC CC C CAGAT 

TC CTGCTGTGTTAG AGAATT C C CAGG ATGTTCCAAACAGGC CCAC CAGG AAGATCT CAGTGA 

CCTTTATCAAGAGGGTTGTGGGAAGAAAATGTATTCCTTTTTGAGAGGAACCAAACAACTGC 

AGGTGCTGAGGTTTCTGGGAATCTCCATTGGGGTGACACAAATCCTGGCCATGAl'TCTCACC 

ATTACTCTGCTCTGGGCTCTGTATTATGATAGAAGGGAGCCTGGGACAGACCAAATGATGTC 

CTTGAAGAATGACAACTCTCAGCACCTGTCATGTCCCTCAGTAGAACTGTTGAAACCAAGCC 

TGTCAAGAATCTTTGAACACACATCCATGGCAAACAGCTTTAATACACACTTTGAGATGGAG 

GAG TTATA^AAAGAAATGTCACAGAAGAAAACCA CAAACTTGT TTTATTGGACTTGTGAATT 

TTTGAGTACATACTATGTGTTTCAGAAATATGTAGAAATAAAAATGTTGCCATAAAATAACA 

CCTAAGCATATACTATTCTATGCTTTAAAATGAGGATGGAAAAGTTTCATGTCATAAGTCAC 

CACCTGGACAATAATTGATG C C CTTAAAATGCTGAAGA CAGAT GTCATACCC ACTGTGTAGC 

CTGTGTATGACTTTTACTGAAC ACAGTTATGT TT TGAG GCAGCATGGTTT GATTAG CATTTC 

CGCAT C CATGCAAACG AGTCAC AT ATGGTGGG ACTGGAGC CATAGT AAAGGTTGATTTACTT 

CTACCAACTAGTATATAAAGTACTAATTAAATGCTAACATAGGAAGTTAGAAAATACTAATA 

ACTTTTATTACTCAGCGATCTATTCTTCTGATGCTAAATAAATTATATATCAGAAAACTTTC 

AATATTGGTGACTACCTAAATGTGATTTTTGCTGGTTACTAAAATATTCTTACCACTTAAAA 

GAGCAAGCTAAGACATTGTCTTAAGCTGATCAGGGATTTTTTGTATATAAGTCTGTGTTAAA 

T CTGTATAATTGAGTCGATTTCAGTT CTGATAATGTTAAGAATAACCATTATGAAAAGGAAA 

ATTTGTCC TGTATAGCATCATTAT TTTTAGCCTTTCCTGTT AATAAAG CTTTACTATTCT GT 

CCTGGG CT TATATT ACACATAT AACTGTTATTTAAATACITAACCACTAATT TTGAAAATTA 

CCAGTGTGATACATAGGAATCATTATTCAGAATGTAGTCTGGTCTTTAGGAAGTATTAATAA 

GAAAAT TTG CACATAACTTAGTTGATTCAGAAAGGACTTGTATGCTGTTTTT CTCCCAAATG 

AAGACTCTTTTTGACACTAAACACTTTTTAAAAAGCTTATCTTTGCCTTCTC 

GCAATAGT CT CCAAGT CAATAT AAATTCTAC AGAAAAT AGTGTTC TTTTT CT C CAGAAAAAT 

GCTTGTG AGAAT CATTAAAACATGTGACAATTT AGAG ATT CTTTG TTTTATTTCACTGATTA 

ATATACTGTGGGAAATTACACAGATTATTAAATTTTTTTACAAGAGTATAGTATATTTATTT 

GAAATGGGAAAAGTGCATTTTACTGTATTTTGTG TATTTTGTTTAT TTCT CAGAATATGGAA 

AGAAAATTAAAATGTGT CAATAAATATTTTC TAGAGAGT AA 
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FIGURE 154 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68880 
xsubunit 1 of 1, 305 aa, 1 stop 
><MW: 35383, pi: 5.99, NX(S/T): 0 

MAREDSVKCLRCLLYAI^LLFWLMSISVLAVSAWMRDYLNNVLTLTAETRVEEAV 

VHPVMIAVCCFLIIVGMLGYCGTVKRNLLLIA^ 

WSDMVTLKARMTNYGLPRYRWLT^ 

PGCSKQAHQEDLSDLYQEGCGKKOTSFLRGTKQLQVLRFLGISIGVTQIIiAMILTITLLW^ 
YYDRREPGTDQMMSLKNDNSQHLSCPSVELLKPSLSRIFEHTSMANSFNTHFEMEEL 

Signal peptide: 

amino acids 1-33

Transmembrane domains: 

amino acids 12-35, 57-86, 94-114, 226-248 
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FIGURE 155

GAG AGAGGCAGCAG CTTG CTCAG CGGACAAGGATGCTGGG CGTGAGGG ACCAAGGC CTGC C C 

TGCACTCGGGCCTCCTCCAGCCAGTGCTGACCAGGGACTTCTGACCTGCTGGCCAGCCAGGA 

CCTGTGTGGGGAGGCCCTCCTGCTGCCTTGGGGTGACAATCTCAGCTCCAGGCTACAGGGAG 

ACCGGGAGGATCACAGAGCCAGCATGTTACAGGATCCTGACAGTGATCAACCTCTGAACAGC 

CTCGATGTCAAACCCCTGCGCAAACCCCGTATCCCCATGGAGACCTTCAGAAAGGTGGGGAT 

CCCCATCATCATAGCACTACTGAGCCTGGCGAGTATCATCATTGTGGTTGTCCTCATCAAGG 

TGATTCTGGATAAATACTACTTCCTCTGCGGGCAGCCTCTCCACTTCATCCCGAGGAAGCAG 

CTGTGTGACGGAGAGCTGGACTGTCCCTTGGGGGAGGACGAGGAGCACTGTGTCAAGAGCTT 

CCCCGAAGGGCCTGCAGTGGCAGTCCGCCTCTCCAAGGACCGATCCACACTGCAGGTGCTGG 

ACTCGGCCACAGGGAACTGGTTCTCTGCCTGTTTCGACAACTTCACAGAAGCTCTCGCTGAG 

ACAGC CTGT AGG CAGATGGG CTACAG CAGAGCTGTGGAGATTGGC C C AGACCAGGATCTGGA 

TGTTGTTGAAAT CACAGAAAACAGCCAGGAGCTTCGCATGCGGAACT CAAGTGGGCCCTGTC 

TCTCAGGCTCCCTGGTCTCCCTGCACTGTCTTGCCTGTGGGAAGAGCCTGAAGACCCCCCGT 

GTGGTGGGTGGGGAGGAGGCCTCTGTGGATTCTTGGCCTTGGCAGGTCAGCATCCAGTACGA 

CAAACAGCACGTCTGTGGAGGGAGCATCCTGGACCCCCACTGGGTCCTCACGGCAGCCCACT 

GCTTCAGGAAACATACCGATGTGTTCAACTGGAAGGTGCGGGCAGGCTCAGACAAACTGGGC 

AGCTTCCCATCCCTGGCTGTGGCCAAGATCATCATCATTGAATTCAACCCCATGTACCCCAA 

AGACAATGACATCGCCCTCATGAAGCTGCAGTTCCCACTCACTTTCTCAGGCACAGTCAGGC 

CCATCTGTCTGCCCTTCTTTGATGAGGAGCTCACTCCAGCCACCCCACTCTGGATCATTGGA 

TGGGGCTTTA CGAAGCAGAATGGAGGGAAGATGT CTGACATACTGCTG CAGGCGT CAGTC CA 

GGTCATTGACAGCACACGGTGCAATG CAGACGATG CGTAC CAGGGGGAAG T CAC CGAGAAGA 

TGATGTGTGCAGGCATCCCGGAAGGGGGTGTGGACACCTGCCAGGGTGACAGTGGTGGGCCC 

CTGATGTACCAATCTGACCAGTGGCATGTGGTGGGCATCGTTAGCTGGGGCTATGGCTGCGG 

GGGCCCGAGCACCCCAGGAGTATACACCAAGGTCTCAGCCTATCTCAACTGGATCTACAATG 

TCTGGAAGGCTGAGCTGTAATGCTGCTGCCCCTTTGCAGTGCTGGGAGCCGCTTCCTTCCTG 

CCCTGC CCAC CTGGGGAT CC CC CAAAGTCAGACACAGAG C AAGAGTCCC CTTGGGTACAC CC 

CTCTGCCCACAGCCTCAGCATTTCTTGGAGCAGCAAAGGGCCTCAATTCCTGTAAGAGACCC 

T C GCAG CC CAGAGGCG CC CAGAGGAAGT CAGC AGC C CTAGCT CGGCCACACTTGGTGCT CCC 

AGCAT C CC AGGG AGAGACAC AG CC CACTGAACAAG GTCTCAGGGGTATTG CTAAG CCAAGAA 

GGAA CTTT CCCACAC TACTGAATGGAAGCAGG CTGTCTTGTAAAAGCCCAGAT CACTGTGGG 

CTGGAGAGGAGAAGGAAAGGGTCTGCGCCAGCCCTGTCCGTCTTCACCCATCCCCAAGCCTA 

CTAGAG CAAGAAAC CAGTTGTAATATAAAATGCACTGCCCTACT GTTGGTATGACT AC CGTT 

ACCTACTGTTGTCATTGTTATTACAGCTATGGCCACTATTATTAAAGAGCTGTGTAACATCT 
CTGGCAAAAAAAAAAAA 
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FIGURE 156 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA68885
xsubunit 1 of 1, 432 aa, 1 stop 
><MW: 47644, pi: 5.18, NX(S/T): 2 

MLQDPDSDQPLNSLDVKPLRKPRIPMETFRKVGIPIIIALLSLASIIIWVLIKVILDKYYF 
LCGQPLHFIPRKQLCDGELDCPLGEDEEHCVKSFPEGPAVAVRLSKDRSTLQVLDSATGNWF 
SACFDNFTEALAETACRQMGYSRAVEIGPDQDLDWEITENSQELRMRNSSGPCLSGSLVSL 
HCLACGKSLKTPRWGGEEASVDSWPWQVS IQYDKQHVCGGS ILDPHWVLTAAHCFRKHTDV 
FNWKVRAGSDKLGSFPSLAVAKI 1 1 IEFNPMYPKDNDIALMKLQFPLTFSGTVRPICLPFFD 

EELTPATPLWI IGWGFTKQNGGKMSDILLQASVQVIDSTRCNADDAYQGEVTEKMMCAGI PE 
GGVDTCQGDSGX3PLNnfQSIX2WHWGIVSW 

Transmembrane domain: 

amino acids 32-53 (type II)
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FIGURE 157 

GGGCTGAGGCACTGAGAGACCGGAAAGCCTGGCATTCCAGAGGGAGGGAAACGCAGCGGCATCCCCAGGCTCCAG 

AGCTCCCTGGTGACAGTCTGTGGCTGAGCATGGCCCTCCCAGCCCTGGGCCTGGACCCCTGGAGCCTCCTC 

TTTTCCTCTTCCAACTGCTTCAGCTGC^ 

GGGTCAGATACTATGCAGGGGATGAACGTAGGGCACTTAGCTTCTTCCACCAGAAGGG 

CTCTGCTCCTCiAGTGGTGATGGAAATACTCTCTACGTGGGGGCTCGAGAAGCCATTCTGGCCTTGGATAT^ 

ATCCAGGGGTCCCCAGGCTAAAGAACATGATACCGTGGCCAGCCAGTGACAGAAAAAAGAGTGAA 

AG AAGAAGAGCAATGAG ACAC^GTCTTTCA^CTT CA.TCCGTGTCCTCGTTT CTTACAATGTCACCCATCTCTACA 

CCTGCGGGACCTITCGCCTTCAGCCCTGCTTGTACCTTCATTGAACITCAA 

AG^ACAAGGTCATGGAGG<3AAAAGGCCAAAGCCCCTTTGACCCC 

GGATGCTCTATTCTGGTACTATGAACAACTTCCTGGGCAGTGAGCCCATCCTGATGCGCAC^ 
CTGTCCTCAAGACCGAC^CTTCCTCCGCTGGCTGCATCATGACGCCTCCTTTGTGGCAGC 
AGGTCGTCTACTTCTTCTTCGAGGAGACAGCCAGCGAGTTTGACTT^ 
CTAGAGTCTGCAAGAATGACGTGGGCGGCGAAAAGCrrGCTGCAGAAGA^^ 

TGCTCTGCACCCAGCCGCGGCAGCTGCCCTTCAACGTCATCCGCCACGCGGTCCTGCTCCCCGCCGATTCTCCCA 

CAGCTCCCCACATCTACGCAGTCTTCACCTCCCAGTG<3C^^ 

TCTCTCTCTTGGACATTGAACGTCTCTTTAAGGGGAAATACAAA 

CTTATAGGGGCCCTGAGACCAAC CCC CGGCCAGGCAGTTGCTCAGTGGGCCC CTCCTCTGATAAGGCCCTGACCT 

TCATGAAGGACCATTTCCTGATGGATGAGCAAGTGGTGGGGACGCCCCTGCTGGTGA^ 

CACGGCTTGCAGTGGAGACAGGCCAGGGCCTTGATGGGCAG&GCGATCTTGTC 

GGTCGCTCCACAAGGCTGTGCTAAGTGGGGACAGCAGTGCTCATCTGGTGGAAGAGATTCAGCTGTTCCCTGACC 
CTGAACC TGTTCGCAACCTGCAGCTGGCCCCCACCCAGG GTGCAGTGTTTGTAGGCTTCTCAGGAGGTGTCTGGA 
GGGTGCCCCGAGCCAACTGTAGTGTCTATGAGAGCTGTGTGGACTGTGTCCTTGCCCGGGACCCCCACTGTGCCT 
GGGACCCTGAGTCCCGAACCTGTTGCCTCCTGTCTGCCCCCAACCTGAACTCCTGGAAGCAGGACATGGAGCGGG 
GGAACCCAGAGTGGGCATGTGCCAGTGGCCCCATGAGCAGGAGCCTTCGGCCTCAGAGCCGCCCGCAAATCATTA 
AAGAAGTCCTGGCTGTCCCCAACTCCAT CCTGGAGCTCCCCTGCCC CCACCTGTCAG CCTTGGC CTCTTATTATT 
GGAGTCATGGCCCAGCAGCAGTCCCAGAAGCCTCTTCCACTGTCTACAATGGCTCCCTC 

ATGGAGTTGGGGGTCTCTAC CAGTG OTGGGCAACTGAGAATGGCTTTTCATACCCTGTGATCTCCTACTGGGTGG 

ACAGCCAGGACCAGACCCTGGCCCTGGATCCTGAACTGGCAGGCATCCCCCGGGAGCATGTGAAGGTCCCGTTGA 

CCAGGGTCAGTGGTGGGGCCGCCCTGGOTGCCCAGCAGTGCTACTGGCCCCACTTTGTCACTGTCACTGTCCT 

TTGCCTTAGTGCTTTCAG<^GCCCTCATCATCCTCGTGGCCTCCCCATTGAGAGCACTCCGGGCTCGGGG<MGG 

TTCAGGGCTGTGAGACCCTGCGCCCTGGGGAGAAGGCCCCGTTAAGC^AGAGCAACACCTCCAGTCTCCCAAGG 

AATGCAGGACCTCTGCCAGTGATGTGGACGCTGACAACAACTGCCTAGGC^ 

CAGGCCGGGGCTGCGGTGCAGGCACCTGG CCATGCTGGCTGGGCGGC CCAAGGACAGCCCTGACTAGG ATGACAG 
CAGCACAAAAGACCACCTTTCTCCCCTGAGAGGAGCTTCTGCTACTCTGCATCACTGATGACACTCAGCAGGGTG 

CCCCAGACCTGCTCCTACACTGATATTGAAGAACCTGGAGAGGATCCTTC^GTTCTGGGCATTCCAGGGACCCTC 
CAGAAACACAGTGTTTCAAGAGACCCTAAAAAACCTG CCTGTC CCAGGACCCTATGGTAATGAACACCAAACATC 
TAAACAATCATATGCTAACATGCCACTCCTGGAAACTCCACTCTGAAGCTC^ 

TCTC GCAGOTTCATGCAGGG ATCTGCTCCCTCCTGCTT CCCTTACCAGTCGTGCACCG CTGACTCCCAGGAAGTC 
TTTCCTGAAGTCTGACCACCTTTCTTCTTGCTTCAGTTGGGGCAGACTCTGATCCCT^ 

CAGGGGTAATCTGAGCGTTCTTCACTCCTTTACCCTAGCTGACCCCTTCACCTCTCCCCCTCCCTTTTCCTTTGT 
TTTGGGATTCAGAAAACTGCTTGTCAGAGACTGTTTATTTTTTATTAAAAATATAAGGC^ 
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FIGURE 158 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71166 
xsubunit 1 of 1, 761 aa, 1 stop 
><MW: 83574, pi: 6.78, NX(S/T): 4 

MALPALGLDPWSLLGLFLFQLLQLLLPTTTAGGGGQGPMPRVRYYAGDERRALSFFHQKGLQ 
DFDTLLLSGDGOTLYVGAREAILALDIQDPGVPRLKNMIPWPASDRKKSECAFKKKSNETQC 
FNFIRVLVSYNVTHLYTCGTFAFSPACTFIELQDSYLLPISEDKVMEGKGQSPFDPAHKHTA 
VLVDGMLYSGTMNNFLGSEPILMRTLGSQPVLKTDNFLRWLHHDASFVAAIPSTQVVYFFFE 
ETASEFDFFERLHTSRVARVCKNDVGGEKLLQKKWTTFLKAQLLCTQPGQLPFNVIRHAVLL 
PADSPTAPHIYAVFTSQWQVGGTRSSAVCAFSLLDIERVFKGKYKELNKETSRWTTYRGPET 
NPRPGSCSVGPSSDKALTFMKDHFLMDEQWGTPLLVKSGVEYTRLAVETAQGLpGHSHLVM 
YLGTTTGSLHKAWSGDSSAHLVEEIQLFPDPEPVRNLQLAPTQGAVFVGFSGGVWRVPRAN 
CSVYESC^CVIJ^DPHCAWDPESRTCCLLSAPNI^SWKQDMERGNPEWACASGPMSRSLRP 
QSRPQIIKEVLAVPNSILELPCPHLSALASYYWSHGPAAVPEASSTVYNGSLLLIVQDGVGG 
L YQCWATENGFS Y P V I S YWVDS QDQTLALD P E LAG I P REH VKVP LTR VS GGAALAAQQ S YWP 

HFVTVTVLFALVLSGALIILVASPLRALRARGKVQGCETLRPGEKAPLSREQHLQSPKECR 
SASDVDADNNCLGTEVA 

Signal peptide: 

amino acids 1-30 

Transmembrane domains: 

amino acids 136-156, 222-247, 474-490, 685-704 
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FIGURE 159 

AGGGTCCCTTAGCCGGGCGCAGGGCGCGCAGCCCAGGCTGAGATCCGCGGCTTCCGTAGAAG 
TGAGCA^CTGGGCAGCGAGTGCTTCTTCTAGTGGGCTTCCTTCTCCCTGGGGTCCTGCTC 
TCAG AGGCTGC CAAAAT C CTGACAAT AT CT AC AGTAGGTG GAAG CC ATTATCTACTG ATGGA 
CCGGGTTTCTCAGATT CTTCAAGATC ACGGTC ATAATGTC AC CATG CTTAACCACAAAAGAG 
GTCCTTTTATGC CAGATTTTAAAAAGGAAGAAAAATCATATCAAG TTATCAGTTGG CTTGCA 
CCTGAAGAT CATCAAAGAGAAT TT AAAAAGAGTTTTGATTTCTTTCTGGAAGAAACTTTAGG 
TGGCAGAGGAAAATTTGAAAACTTATTAAATGTTCTAGAATACTTGGCGTTGCAGTGCAGTC 
ATTTTTTAAAT AG AAAGG ATATCATGGATT C C TTAAAG AATGAG AACTT CGACATGGTGATA 
GTTGAAACT TTTG A CTACTG T C CTTT CCTG ATTGCTG AGAAGCTTGGGAAG CCATTTGTGGC 
CATTCTTTCC^CTTCATTCGGCTCTTTGGAATTTGGGCTACCAATCCCCTTGTCrTATGTTC 
»GTATTCCGTTCCTTGCTGACTGATCACATGGACTTCTGGGGCCGAGTGAAGAATTTTCTG 
ATGTTCTTTAGTTTCTGCAGGAGGCAACAGCACATGC^GTCTACATTTGACAACACCATCAA 
GGAACATTTCACAGAAGGCTCTAGGCCAGTTTTGTCTCATCTTCTACTGAAAGCAGAGTTGT 
GGTTCATTAACTCTGACTTTGCCTTTGATTTTGCTCGACCTCTGCTTCCCAACACTGTTTAT 
GTTGGAGGCTTGATGGAAAAACCTATTAAACCAGTACCACAAGACTTGGAGAACtTCATTGC 
CAAGTTTGGGGACTCTGGTTTTGTCCTTGTGACCTTGGGCTCCATGGTGAACACCTGTCAGA 
AT CCGG AAATCTT CAAGGAGATGAACAATGC CTTTG CTCACC TACC C CAAGGGGTG ATATGG 
AAGTGTCAGTGTTCTCATTGGCCCAAAGATGTCCACCTGGCTGCAAATGTGAAAATTGTGGA 
CTGGCTTCCTCAGAGTGACCTCCTGGCTCACCCAAGCATCCGTCTGTTTGTCACCCACGGCG 
GG CAG AAT AGCAT AATGGAGGC CAT C CAGCATGGTG TGCC CATGGTGGGGAT CCCT CT CTTT 
GGAGACCAGCCTGAAAACATGGT C CGAGTAGAAG CC AAAAAGTTTG G TGTTT CT ATT CAGTT 
AAAGAAG C T CAAGG CAGAGA CATT GGCT C T T AAGATGAAA CAAA T CATGG AAGA CAAGAGAT 
ACAAGTCCGCGGCAGTGGCTGCCAGTGTCATCCTGCGCTCCCACCCGCTCAGCCCCACACAG 
CGGCTGGTGGGCTGGATTGACCACGTCCTCCAGACAGGGGGCGCGACGCACCTCAAGCCCTA 
TGTCTTTCAGC^GCCCTGGCATGAGCAGTACCTGTTCGACGTTTTTGTGTTTCTGCTGGGGC 
TCACTCTGGGGACTCTATGGCTTTGTGGGAAGCTGCTGGGCATGGCTGTCTGGTGGCTGCGT 
GGGGCC AGAAAGGTGAAG GAGACATAAGG C CAGGTGC AG CCTTGGCGGGGT CTGTTTGG TGG 
GCGATGTCACCATTTCTAGGGAGCTTCCCACTAGTTCTGGCAGCCCCATTCTCTAGTCCTTC 
TAGTTATCTCCTGTTTTCTTGAAGAACAGGAAAAATGGCCAAAAATCATCCTTTCCACTTGC 
TAATTTTG CT ACAAATTCATC C TTACTAGCTC CTGCCTG CTAGCAGAAATCTTTCCAGTC CT 
CTTGTCCTCCTTTGTTTGCCATC^GCAAGGGCTATGCTGTGATTCTGTCTCTGAGTGACTTG 
GACC^CTGACCCTCAGATTTCCAGCCTTAAAATCCACCTTCCrrTCTCATGCGCCTCTCC^ 
TCACACCCTGACTCTTCCAGCCTCCATGTCC^GACCTAGTCAGCCTCTCTCACTCCTGCCCC 
TACTATCTAT CATGGAAT AACATCCAAGAAAGAC AC CT TG CATATT CTTTCAGTTT CTGTTT 
TGTTCTC C CACATATTCTCTTCAATG CTCAGGAAGC CT GC CCTGTG CTTGAGAGTT CAGGGC 
CGGACACAGGCTCACAGGTCTCCACATTGGGTCCCTGTCTCTGGTGCCCACAGTGAGCTCCT 
TCTTGGCTGAG CAGGCATGG AGACTGTAGG TTTC CAGATTT C CTGAAAAATAAAAGTTTACA 
GCGTTATCTCTCCCCAACCTCACTAA 
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FIGURE 160 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71169 
xsubunit 1 of 1, 523 aa, 1 stop 
><MW: 59581, pi: 8.68, NX(S/T): 1

MAGQRVLLLVGFLLPGVLLSEAAKILTISTVGGSHYLLMDRVSQILQDHGHNVTMLNHKRGP 
FMPDFKKEEKSYQVISWIJVPEDHQREFKKSFDFFLEETLGGRGKFENLLNVLEYLALQCSHF 
LNRKDIMDSLKNENFDMVIVETFDYCPFLIAEKLGKPFVAILSTSFGSLEFGLPIPLSYVPV 
FRSLLTDHMDFWGRVKNFIjyiFFSFCRRQQHMQSTFDNTIKEHFTEGSRPVLSHLLLKAELWF 
INSDFAFDFARPLLPNTVYVGGLMEKPIKPVPQDLENFIAKFGDSGFVLVTLGSMVNTCQNP 
EIFKEMNNAFAHLPQGVIWKCQCSHWPXDVHLAANVKIVDWLPQSDLLAHPSIRLFVTHGGQ 
NSIMEAIQHGVPIWGIPLFGDQPENMVRVEAKKFGVSIQLKKLKAETLALKMKQJMEDKRYK 
SAAVAASVILRSHPLSPTQRLVGWIDHVLQTGGATHLKPYVFQQPWHEQYLFDVFVFLLGLT 
LGTLWLCGKLLGMAVWWLRGARKVKET 

Signal peptide: 

amino acids 1-19 

Transmembrane domain: 

amino acids 483-504 
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FIGURE 161 

GGGCTGTTGATTTGTGGGGGATTTTGAAGAGAGGAGGAATAGGAGGAAGGGGTTGAGGGGCT 
G CCTCTGGCATATGCA CACACTCACACATT CTGT CACACC CGTC ACACACAC ATAC CATGTT 
CTCCATCCCCCCAGGTCCAGCCCTCAGTGCTGTCCCATCCAGCAGGGCTACCCTGAAGCTCT 
GGCTGCAGCCCTCCCGTCCAGTGGGCAGGCGGCTTCATCCCTCCTTTCTCTCCCAAAGCCCA 
ACTG CTG T CACT GC ATGC T CTG CCAAGGAGGAGGGAAC TGCAGTGACAG C AGGAGTAAGAGT 
GGGAGGCAGGACAG AG CTGGGA CACAGGTATGGAGAGGGGG TTCAGCGAGC CTAGAGAGGGC 
AGACTAT CAGGGTG CCGGCG GT GAGAAT CCAGGG AGAGGAGCGGAAACAGAAGAGGGGCAGA 
AGACCGGGGCACTTGTGGGTTGCAGAGCCCCTCAGCCATGTTGGGAGCCAAGCCACACrGGC 
TACCAGGTCCCCTACACAGTCCCGGGCTGCCCTTGGTTCTGGTGCTTCTGGCCCTGGGGGCC 
GGGTGGGCCCAGGAGGGGTCAGAGCCCGTCCTGCTGGAGGGGGAGTGCCTGGTGGTCTGTGA 
GCCTGGCCGAGCTGCTGCAGGGGGGCCCGGGGGAGCAGCCCTGGGAGAGGCACCCCCTGGGC 
GAGTGGCATTTGCTGCGGTCCGAAGCCACCACCATGAGCCAGCAGGGGAAACCGGCAATGGC 
AC CAGTGGGG CCAT CTACTT CGAC CAGGTCCTGGTGAACGAGGGCGGTGGCTTT GACC GGG C 
CTCTGGCTCCTTCGTAGCCCCTGTCCGGGGTGTCTACAGCTTCCGGTTCCATGTGGTGAAGG 
TGTACAACCGCCAAACTGTCCAGGTGAGCCTGATGCTGAACACGTGGCCTGTCA'TCTCAGCC 
TTTGCCAATGATCCTGACGTGACCCGGGAGGCAGCCACCAGCTCTGTGCTACTGCCCTTGGA 
CCCTGGGGACCGAGTGTCTCTGCGCCTGCGTCGGGGGAATCTACTGGGTGGTTGGAAATACT 
CAAGTTTCTCTGGCTTCCTCATCTTCCCTCTCT 

CC AGCC C CTGACAACTTT CTTCTG CCCTCTCTTG C C CC AG AAAC AG CAGAGG CAGGAGAGAG 
ACTCCCTCTGGCTCCTATCCCACCTCTTTGCATGGGACCCTGTGCCAAACACCCAAGTTTAA 
GAGAAGAGTAGAGCTGTGGCATCTCCAGACCAGGCCTTTCCACCCACCCACCCCCAGTTACC 
CTCCCAGCCACCTGCTGCATCTGTTCCTGCCTGCAGCCCTAGGATCAGGGCAAGGTTTGGCA 
AGAAGGAAGATCTGCACTACTTTGCGGCCTCTGCTCCTCCGGTTCCCCCACCCCAGCTTCCT 
GCTCAATGCTGATCAGGGACAGGTGGCGCAGGTGAGCCTGACAGGCCCCCACAGGAGCCCAG 
ATGGACAAGCCTCAGCGTACCCTGCAGGCTTCTTCCTGTGAGGAAAGCCAGCATCACGGATC 
TCAGCCAG CACCGTCAGAAG CTGAGC CAGCAC CGTATG GG CTAGGGTGGGAGGCT CAG CCAC 
AGGCAGAAGGGTGGGAAGGGCCTGGAGTCTGTGGCTGGTGAGGAAGGAAGGAGGGTGTATTG 
TC TAGACTGAAC ATGGT A CACATTCTGCATGT ATAG CAGAGCAGCCAGCAGGTAG CAATC CT 
GGCTGTCCTTCTATGCTGGATCCCAGATGGACTCTGGCCCTTACCTCCCCACCTGAGATTAG 
GGTG AGTGTGTTTG CT CTGG CT GAG AGCAGAGCTGAGAGCAG GTAT ACAGAG CT GGAAGTGG 
ACCATGGAAAACATCGATAACCATGCATCCTCTTGCTTGGCCACCTCCTGAAACTGCTCCAC 
CTTTGAAGTTTGAACTTTAGTCCCTCCACACTCTGACTGCTGCCTCCTTCCTCCCAGCTCTC 
TCACTGAGTTATCTTCACTGTACCTGTTCCAGCATATCCCCACTATCTCTCTTTCTCCTGAT 
CTGTGCTGTCTTATTCTCCTCCTTAGGCTTCCTATTACCTGGGATTCCATGATTCATTCCTT 
CAGACCCTCTCCTGCCAGTATGCTAAACCCTCCCTCTCTCTTTCTTATCCCGCTGTCCCATT 
GG C C C AG CCTGGATGAAT CTATC AATAAAACAACTAGAGAATGGTGGT CAGTGAGACACT AT 
AGAATTACTAAGGAGAAGATGCCTCTGGAGTTTGGATCGGGTGTTACAGGTACAAGTAGGTA 
TGTTGCAGAGGAAAATAAATATCAAACTGTATACTAAAATTAAAAA 
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FIGURE 162 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71180 
xsubunit 1 of 1, 205 aa, 1 stop 
><MW: 21521, pi: 7.07, NX(S/T): 1 

MLGAKPHWLPGPLHSPGLPLVLVLLALGAGWAQEGSEPVLLEGECLVVCEPGRAAAGGPGGA 
ALGEAPPGRVAFAAVRSHHHEPAGETGNGTSGAIYFDQVLVNEGGGFDRASGSFVAPVRGVY 
SFRFHVVKVYNRQTVQVSLMLNTWPVISAFANDPDVTREAATSSVLLPLDPGDRV 
NLLGGWKYSSFSGFLIFPL 

Signal peptide: 

amino acids 1-32 
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FIGURE 163

GCTGTTTCTCTCGCGCCACCACTGGCCGCCGGCCGCAGCTCCAGGTGTCCTAGCCGCCCAGC 
CTCGACGCCGTCCCGGGACCCCTGTGCTCTGCGCGAAGCCCTGGCCCCGGGGGCCGGGGCAT 
GGGCCAGGGGCGCGGGGTGAAGCGGCTTCCCGCGGGGCCGTGACTGGGCGGGCTTCAGCCAT 
GAAGACCCTCATAGCCGCCTACTCCGGGGTCCTGCGCGGCGAGCGTCAGGCCGAGGCTGACC 
GGAGCCAGCGCTCTCACGGAGGACCTGCGCTGTCGCGCGAGGGGTCTGGGAGATGGGGCACT 
GG ATCCAG CATC CTCT C CG C C CTCCAGG AC CT CTT CT CTGT CACCTGG CT CAAT AGGTCCAA 

GGTGGAAAAGCAGCTACAGGTCATCTCAGTGCTCCAGTGGGTCCTGTCCTTCCTTGTACTGG 

GAGTGGCCTGCAGTGCCATCCTCATGTACATATTCTGCACTGATTGCTGGCTCATCGCTGTG 

CTCTACTTCACTTGGCTGGTGTTTGACTGGAACACACCCAAGAAAGGTGGCAGGAGGTCACA 

GTGGGTCCGAAACTGGGCTGTGTGGCGCTACTTTCGAGACTACTTTCCCATCCAGCTGGTGA 

AG AC ACAC AACCTG CT GAC CACCAGG AACT ATAT CTTTGGATAC CACC CCCATG GT AT CATG 

GG CCTGGGTG CCT T CT GCAACTT C AGCACAG AGG C CACAGAAGTGAG C AAGAAGTT CC C AGG 

CATACGGCCTTACCTGGCTACACTGGCAGGCAACTTCCGAATGCCTGTGTTGAGGGAGTACC 

TGATGTCTGGAGGTATCTGCCCTGTCAGCCGGGACACCATAGACTAITTGCTTTCAAAGAAT 

GGGAGTGGCAATGCTATCATCATCGTGGTCGGGGGTGCGGCTGAGTCTCTGAGCTCCATGCC 

TGGCAAGAATGC^GTCACCCTGCGGAACCGCAAGGGCTTTGTGAAACTGGCCCTGCGTCATG 

GAGCTGACC TGGTT C CCAT C T ACTC CTTTGGAGAGAATGAAGTGTACAAG CAGGTGATCTTC 

GAGGAGGGCTCCTGGGGCCGATGGGTCCAGAAGAAGTTCCAGAAATACATTGGTTTCGCCCC 

ATGCATCTTCCATGGTCGAGGCCTCTTCTCCTCCGACACCTGGGGGCTGGTGCCCTACTCCA 

AGCCCATCACCACTGTTGTGGGAGAGCCCATCACCATCCCCAAGCTGGAGCACCCAACCCAG 

CAAGA^TCGACCTGTACCACACCATGTACATGGAGGCCCTGGTGAAGCTCTTCGACAAGCA 

CAAGAC CAAGTT CG GC CT CC CGGAGACTGAGGTC C TGG AGGTGAAC JGAGCCAG CCTT CGGG 

GCCAATTCCCTGGAGGAACCAGCTGCAAATCACTTTTTTGCTCTGTAAATTTGGAAGTGTCA 

TGGGTGTCTGTGGGTTATTTAAAAGAAATTATAACAATTTTGCTAAACCAAAAAAAAAAAAA 

^^^^^^^ 

AAAAAAAAAAAAAAAAAAAA 
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FIGURE 164

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71184
xsubunit 1 of 1, 388 aa, 1 stop 
><MW: 43831, pi: 9.64, NX(S/T): 3 

MKTLIAAYSGVLRGERQAEADRSQRSHGGPALSREGSGRWGTGSSILSALQDLFSVTWLNRS 
KVEKQLQVISVLQWVLSFLVLGVACSAILMYIFCTDCV^IAVLYFTWLVFDWNTPKKGGRRS 
QWVRNWAVWRYFRDYFPIQLVKTHNLLTTRNYIFGYHPHGIMGLGAFCNFSTEA 
GIRPYLATLAGNFRMPVLREYLMSGGICPVSRDTIDYLLSKNGSGNAI I IWGGAAESLSSM 
PGKNAVTLRNRKGFVKLALRHGADLVPIYSFGENEVYKQVIFEEGSWGRWVQKKFQKYIGFA 

PCIFHGRGLFSSDTWGLVPYSKPITTVVGEPITIPKLEHPTQQDIDLYHTMYMEALVKLFDK 
HKTKFGLPETEVLEVN 

Important features of the protein: 
Transmembrane domain: 

amino acids 76-97 

N-glycosylation sites. 

amino acids 60-63, 173-176, 228-231 

N-myristoylation sites. 

amino acids 10-15, 41-46, 84-89, 120-125, 169-174, 229-234, 240- 
245, 318-323, 378-383 
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FIGURE 165 



GGGCGGCGGGATGGGGGCCGOGGGCGGCGGGCGCCGCACTCGCTGAGGCCCCGACGCAGGGCCGGGCCGGGCCCA 
GGGCCGAGGAGCGCGG CGGCCAGAGCGGGG CCGCGGAGGCGACGCCGGGGACGCCCGCGCGACGAGCAGGTGGCG 
GCGGCTGCAGGCTTGTCCAGCCGGAAGCCCTGAGGGCAGCTGTTCCCACTGGCTCTGCTGACCTTGTGCCTTGGA 
CGGCTGTCCTCAGCGAGGGGCCGTGCACCCGCTCCTGAGCAGCGCCATGGGCCTGCTGGCCCT 
GTTCGTGCTGCACCTGCTGGTCGGCTTTGTCTTCGTGGTGAGTGGTCTGGTCATCAACTTCGTCCAGCTGTGCAC 
GGTGGCGCTCTGGCCGGTCAGCAAGCAGCT CTACCGCCGCCTCAACTGCCG CC TCGC CTACTCACTCTGGAGCCA 
AC TGGT CATGCTGCTGGAGTGGTGGTCCTG CACGGAGTGTACACTGTTCACGGACCAGGCCACGGTAGAGCGCTT 



GCGCTTTOGAGTGCTGGGGAGCTCCAAGGTCCTCGCTAAGAAGGAGCTGCTCTA 
GTGGTACTTTCTGGAGATTGTGTTCTGCAAGCGGAAGTGGGAGGAGGACCGGGACACCGTGGT 
GCGCCTGTCGGACTACCCCGAGTACATGTGGTTTCTCCTGTACTGCGAGGGGACGCGCTTCACGGAGACCAAGCA 
CCGCGTTAGCATGGAGGTGGCGGCTGCTAAGGGGCTTCCTGTCCTCAAGTACCACCTGCTGC 
CTTCACCACCGCAGTCAAGTGCCTCCGGGGGACAGTCGCAGCTGTCTATGATGTAACCCTGAACTTCAGAGGAAA 
CAAGAACCCGTCCCTGCTGGGGATCCTCTACGGGAAGAAGTACGAGGCGC^ 

GGAAGACATCCCGCTGGATGAAAAGGAAGCAGCTCAGTGGCTTCATAAACTGTACCAGGAGAAGGACGCGCTCC^ 
GGAGATATATAATCAGAAGGGCATGTTTCCAGGGGAGCAGTTTAAGCCTGCCCGGAGGCCGTGGACCCTCCTGAA 



TCTCCTGATCCTGACTTTClTGGG^TTTGTGGGAGCAGCTTCCm 
TGAACCTGGGAGGTGGAGATTGCAGTG^GCTGAGATGGCATC^CTGTACTCCAGCCTAGGCAACA^ 
CAGTCTCAAAAAAAAAAAAAAACAAAAAAAC CCCAGAAATTCTGG^ 

ATTCACTAGAGGCTGAACAGCAGATTTGAGCAGGCAGAAAAAAATC^GCAAGCTTGAAGATGGTACCTTGAGATT 
TTTCAGGCTAATGAAAAAAGAATGAAGGAAAATTAACAGCCTCAGAGACCCATGGT 

CATATGCATGATGAGAGTC C CAG AAGGAGAGGAGAGAAAGGGTC AGAAAG AATG GC CACAAG CTGATGAAAAACA 
GT AACCTACC CACTCAGGAAGCTCAGTGAACTC CAATGAGGATGAATATCAG AGATCCAC ACCTAGATATTTCAT 
AATCAAAG TG TCAAATGACAAAGAAT C T TGAAAG CAGCAAG AGATGAGCAACTTAT CTTG TTCAAAG GATC TTTG 
ATCAGATTAACAGCTCATTTCTCCTaVGAAATCATGGGAGCCAGGAGATAGTGGGAT 
AACCTTCAACTGTAATTATTGGACTTTTGAGTCTTAGATGGT 

ATTTAATC CCTAATAAGAATT AGT C AAG C T7 C CTTGAC CTGTAGG AAGG C CTGTCTTTAG GC CGGG CACAGTGGC 

TTACACCTGTAATCCCAGC^CTTTGGGAGGCCCAGACGGGTGGATCATTTGGGGTCA^ 

GAGT TCAG GTGATCTGCCCGCCTCAGCCTTCCCAAAGTGTTGTGATTGCAGGCGTO 

atttctttttaaggctgaatgatgggg<k:caggcacgatggot 
aacatgcaccaccatgcctggctaatttttgtatttttagtagm 

GACCTCAAGTGACCACCTGCCTCAGCCTCCCAAAGTAC^ 

G ^ TCTTCTGATGTGC ^ AT, ^ C ^ T ^^ 

CCTTTTTAAATTTTTATTATTTATTTATTTATTTATTTTC^GACAGGG 
CAGTGCCACAGTCTTGGCTCACTGCAGCCTCGACCTCCTG^ 
AGCTGTATTTTTTTGTATTTTGTATTTTCTAGCTGTA 
TGCECAGGCTGGTCTTCaA^ 

CATGAGCCACTGCA CCTGG CAAACTCCCAAAATTCAACACACACIACACAAAAAACC ACCTG ATTCAAAATGGG 

GAGGGGCCGGGTGTGGCCCCAACTACCAGGGAGACTGAAGTGGGAGGATCGCTTGGGCATGAGAAGTC 

CAGTGAGTCGAGGTTGTGCGACTGCATTCCAGCCTGGACAACAGAGTGAGACCCTGTCTC 




kTGTGTGA 
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FIGURE 166 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71213
xsubunit 1 of 1, 368 aa, 1 stop 
><MW: 42550, pi: 9.11, NX(S/T): 1 

MGLLAFLKTQFVLHLLVGFVFWSGLVINFVQLCTLALWPVSKQLYRRLNOT 

MLLEWWSCTECTLFTDQATVERFGKEHAVIILNHNFEIDFLCGWTMCERFGVLGSSKVLAKK 

ELLYVPLIGWTVryFLEIVFCKRKWEEDRDTVVEGLRRLSDYPEYMWFLLYCEGTRFTETKTO 

VSMEVAAAKGLPVLKYHLLPRTKGFTTAVKCLRGTVAAVYDVTLNFRGNKNPSLLGILYGKK 

YEADMCWRFPLEDIPLDEKEAAQWLHKLYQEKDALQEIYNQKGMFPGEQFKPARRPWTLLN 

FL S WAT I LL S PLFS F VLGVF AS G S P LL I LTFLG FVGAAS FGVRRL I GES LE PGRWRLQ 

Important features of the protein: 
Signal peptide: 

amino acids 1-25 

Transmembrane domains: 

amino acids 307-323, 335-352 

Tyrosine kinase phosphorylation sites. 

amino acids 160-168, 161-169 



WO 00/12708 



PCT/US99/20111



FIGURE 167 

GATATTCTTTATTTTTAAGAATCTGAAGTACTATGCATCACT C C CTCCAATGT C CTGGG GCA 

GCCACCAGGCATATTCATCTTTGTGTGTGTTTTTCTTTTGCTTTAGCACTGGGGCACTTCTT 

GCTTATTT CTTTGGTAGGAAAGGGGCTCAGTTTGTCTTGTGGGGTTGGTGGCAGGCAGG CCG 

G CTT ACGC CTGATACGG CCCTGGGTTAGAAGGGAAGGG AAGATAAACT TTT ATACAAATGGG 

GATAGCTGGGGTCTGAGACCTGCTTCCTCAGTAAAATTCCTGGGATCTGCCTATACCTTCTT 

TTCTCTAACCTGGCATACCCTGCTTAAAGCCTCTCAGGGCTTCTCTCTGTTCTTAGGATCAA 

AGTATTTAGAGCTACAAGAGCCCTCATGGTCTGGCCCCTGCCCCCCTGGCCAGCTTCATTGT 

ACATGTGGTGTTCTCTTGTCGTTCCTGTAATGTGGTATGCCATGGGGTCTTTGCACAAGCCT 

TTCCTCTTTGGCTGGACACTGTTCCCTGCCCCCCCCATACTCTTCCTACTTAATATGTAGTC 

ATCCTGCAGATTTCAATTCTAACATCATTTTCTCCAGGGATCCTGGCCTGACAGAATCTCAT 

CTTGTTTAATGCTCTCATAAGACCACTTGTTTCCCTTTTGCAGCACTTGCCACTCAGTTGTA 

TCTTTATGTGCGTTTGTGGTTGTATGGGTTGTGTCTGTTCCCCAGAATGCCCAGCTCTGAGC 

TGCGTGAGGGTCAAGGGCATTGCTGTGCCTGCCAGGTATAGTGCCTACATGTGGTGGGTGCT 

CATGTTTTAGAGACTAAATGGAGGAGGAGATGAGGAAAAGATTGAAATCTCTCAGTTCACCA 

GATGGTGTAGGGCCCAGCATTGTAAATTCACACGTTGACTGTGCTTGTGAATTATCTGGGGA 

TGCAGGT CCTGATT CAGTAGGCCCAGGTTGGGCATCTCTAACAAACTCCCACGTGATG CTGA 

TGCTGGTCCTATGAACTATACTAAATAGTAAGAATCTATGGAGCCAGGCTGGGCATGGTGGC 

TCACACCTATGATCCCAGCACTTTGGGAGGCTGAGGCAGGCTGATCACCTGGAGTCAGGATT 

TCAAGACTAGCCTGGCCAACATGGTGGAACCCCATCTGTACTAAAAATACACAAATTAGCTG 

GGCATGGTGGCACATGCCTGTAGTCCCAGCTACTTGGGAGGCTGAAGCAAGAGAATCGCTTG 

AACCTGGGAGGCGGAGGTTGCAGTGAGCCGAGATCAGGC CACTGTATTC CAACCAGGGTGAC 

AGAGTGAGACT CT ATGTCCAAAAAAAAAAAAA 
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FIGURE 168

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71234 
xsubunit 1 of 1, 143 aa, 1 stop 
><MW: 15624, pi: 9.58, NX(S/T): 0 

MHHSLQCPGAATRHIHLCVCFS FAIALGHFLL IS LVGKGLSLSCGVGGRQAGLRLIRPWVRR 

EGKINFYTNGDSWGLRPASSVKFLGSAYTFFSLTWHTLLKASQGFSLFLGSKYLELQEPSWS 
GPCPPGQLHCTCGVLLSFL 

Important features of the protein: 
Signal peptide: 

amino acids 1-28 



J 70 'Z70 
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FIGURE 169 

GGCTGGACTGGAACTCCTGGTCCCAAGTGATCCACCCGCCTCAGCCTCCCAAGGTGCTGTGA 
TTATAGGTGTAAGCCACCGTGTCTGGCCTCTGAACAACTTTTTCAGCAACTAAAAAAGCCAC 
AGGAGTTGAACTGCTAGGATTCTGACTASGCTGTGGTGGCTAGTGCTCCTACTCCTACCTAC 
ATTAAAATCTGTTTTTTGTT CTCTTGT AAC TAG C CTTTAC CTTC CTAACACAGAGG AT CTGT 
CACTGTGGCTCTGG CCCAAAC CTGAC CTT C ACTCT GG AACGAG AACAGAGG TTT CT AC CCAC 
ACCGTCCCCTCGAAGCCGGGGACAGCCTCACCTTGCTGGCCTCTCGCTGGAGCAGTGCCCTC 
ACCAACTGTCTCACGTCTGGAGGCACTGACTCGGGCAGTGCAGGTAGCTGAGCCTCTTGGTA 
GCTGCGGCTTTCAAGGTGGGCCTTGCCCTGGCCGTAGAAGGGAT^CAAGCCCGAAGATTT 
CATAGGCGATGGCTCCCACTGCCCAGGCATCAGCCTTGCTGTAGTCAATCACTGCCCTGGGG 
CCAGGACGGGCCGTGGACACCTGCTCAGAAGCAGTGGGTGAGACATCACGCTGCCCGCCCAT 
CTAACCTTTTCATGTCCTGCACATCACCTGATCCATGGGCTAATCTGAACTCTGTCCCAAGG 
AACCCAGAGCTTGAGTGAGCTGTGGCTCAGACCCAGAAGGGGTCTGCTTAGACCACCTGGTT 
TATGTGACAGGACTTGCATTCTCCTGGAACATGAGGGAACGCCGGAGGAAAGCAAAGTGGCA 
GGGAAGGAACTTGTG C CAAATTATGG GT CAGAAAAGATGGAGGTGTTGGGTTATCACAAGGC 
ATCGAGTCTCCTGCATTCAGTGGACATGTGGGGGAAGGGCTGCCGATGGCGCAT6ACACACT 
CGGGACTCACCTCTGGGGCCATCAGACAGCCGTTTCCGCCCCGATCCACGTACCAGCTGCTG 
AAGGGC AACTGCAGGC CGATGCTCT CATCAGC CAGGCAGC AG CC AAAAT CTG CGAT CACC AG 
CCAGGGGCAGCCGTCTGGGAAGGAGCAAGCAAAGTGACCATTTCTCCTCCCCTCCTTCCCTC 
TGAGAGGCCCTCCTATGTCCCTACTAAAGCCACCAGCAAGACATAGCTGACAGGGGCTAATG 
GCT C AG TGTTGGC CCAGGAGGTCAG CAAGG CCTG AGAG CTGAT CAG AAGGGCCTGCTGTGCG 
AACACGGAAATGCCTCCAGTAAGC7VCAGGCTGCAAAATCCCCAGGCAAAGGACTGTGTGGCT 
CAATTTAAATCATGTTCTAGTAATTGGAGCTGTC CC CAAG ACCAAAGGAG CTAGAG CTTGGT 
TCAAATGAT CTCCAAGGGC CCTTATACCCCAGGAGACTTTGATTTGAATTTGAAACCCCAAA 
TCCAAACCTAAGAACCAGGTGCATTAAGAATCAGTTATTGCCGGGTGTGGTGGCCTGTAATG 
C CAACATTTTGGGAGG CCGAGG CGGGTAGATCAC CTGAGGTC AGGAGTTCAAGAC CAGCCTG 
GCCAACATGGTGAAACCCCTGTCTCTACTAAAAATACAAAAAAACTAGCCAGGCATGGTGGT 
GTGTGC CT GTAT CCCAG CTACT CGGGAGG C TGAG AC AGGAGAATTACTTGAACCTGGGAGGT 
GAAGGAGG CT GAGACAGG AG AATCACTTCAGC CTGAGC AACACAGCGAGACT CTGT CT CAGA 
AAAAATAAAAAAAGAATTATGGTTATTTGTAA 



/7//J2 76 
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FIGURE 170 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71277
xsubunit 1 of 1, 109 aa, 1 stop 
><MW: 11822, pi: 8.63, NX(S/T): 0 

MLWWLVLLLLPTLKSVFCSLVTSLYLPNTEDLSLWLWPKPDLHSGTRTEVSTHTVPSKPGTA 
SPCWPLAGAVPSPTVSRLEALTRAVQVAEPLGSCGFQGGPCPGRRRD 

Signal peptide: 

amino acids 1-15 
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FIGURE 171 

GCGGGCCCGCGAGTCCGAGACCTGTCCCAGGAGCTCCAGCTCACGTGACCTGTCACTGCCTC 
CCGCCGCCTCCTGCCCGCGCC^SGACCCAGCCGGTGCCCCGGCTCTCCGTGCCCGCCGCGCT 
GGCCCTGGGCTCAGCCGCACTGGGCGCCGCCTTCGCCACTGGCCTCTTCCTGGGGAGGCGGT 
GCCCCCCATGGCGAGGCCGGCGAGAGCAGTGCCTGCTTCCCCCCGAGGACAGCCGCCTGTGG 
CAGT ATCTT CTG AGCCG C TC CATGCGGGAG CACC CGGCGCTG CGAAG C CTGAGG CTGCTGAC 

CCTGGAGCAGCCGCAGGGGGATTCTATGATGACCTGCGAGCAGGCCCAGCTCTTGGCCAACC 
TGGCGCGGCTCATCCAGGCCAAGAAGGCGCTGGACCTGGGCACCTTCACGGGCTACTCCGCC 
CTGGCCCTGGCCCTGGCGCTGCCCGCGGACGGGCGCGTGGTGACCTGCGAGGTGGACGCGCA 
GCCCCCGGAGCTGGGACGGCCCCTGTGGAGGCAGGCCGAGGCGGAGCACAAGATCGACCTCC 
GGCTGAAGCCCGCCTTGGAGACCCTGGACGAGCTGCTGGCGGCGGGCGAGGCCGGCACCTTC 
GACGTGGCCGTGGTGGATGCGGACAAGGAGAACTGCTCCGCCTACTACGAGCGCTGCCTGCA 
GCTGCTGCGACCCGGAGGCATCCTCGCCGTCCTCAGAGTCCTGTGGCGCGGGAAGGTGCTGC 
AACCTCCGAAAGGGGACGTGGCGGCCGAGTGTGTGCGAAACCTAAACGAACGCATCCGGCGG 
GACGTCAGGGTCTACATCAGCCTCCTGCCCCTGGGGGATGGACTCACCTTGGCCTTCAAGAT 
CTAGGGCTGGCCCCTAGTGAGTGGGCTCGAGGGAGGGTTGCCTGGGAACCCCAGGAATTGAC 
CCTGAGTTTTAAATTCGAAAATAAAGTGGGGCTGGGACACAAAAAAAAAAAAAAAAAAA 



WO 00/12708 
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FIGURE 172

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71282
xsubunit 1 of 1, 262 aa, 1 stop 
><MW: 28809, pi: 8.80, NX(S/T): 1 

MTQPVPRLSVPAALALGSAALGAAFATGLFLGRRCPPWRGRREQCLLPPEDSRLWQYLLSRS 

MREHPALRSLRLLTLEQPQGDSMMTCEQAQl^ANLARLIQAKKALDLGTFTGYSAL^^ 

PADGRVVTCEVDAQPPELGRPLWRQAEAEHKIDLRLKPALETLDELLAAGEAGTFDVAVVDA 

DKENCSAYYERCLQLLRPGGILAVLRVLWRGKVLQPPKGDVAAECVRNLNERIR^ 

LLPLGDGLTLAFKI 

Important features of the protein: 
Signal peptide: 

amino acids 1-25 

Transmembrane domains: 

amino acids 8-30, 109-130 

N-glycosylation site. 

amino acids 190-193 

Tyrosine kinase phosphorylation site. 

amino acids 238-246 

N-myristoylation sites. 

amino acids 22-27, 28-33, 110-115, 205-210, 255-260 

Amidation sites. 

amino acids 31-34, 39-42 
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FIGURE 173 

CCGCCGCCGCAGCCGCTACCGCCGCTGCAGCCGCTTTCCGCGGCCTGGGCCTCTCGCCGTCA 

GCASSCCACACGCCTTCAAGCCCGGGGACTTGGTGTTCGCTAAGATGAAGGGCTACCCTCAC 

TGGCCTGCCAGGATCGACGACATCGCGGATGGCGCCGTGAAGCCCCCACCCAACAAGTACCC 

CATCTTTTTCTTTGGCACACACGAAACAGCCTTCCTGGGACCCAAGGACCTGTTCCCCTACG 

ACAAATG T AAAGA CAAG T AC GG GAAG CC CAACAAG AGG AAAG G C T T CAAT GAAGGG CTGTGG 

GAGATCCAGAACAACCCC CACG CCAG CTACAG CGCCCCTCCGC CAGTG AGCT C CTCCGACAG 

CGAGGCCCCCGAGGCCAACCCCGCCGACGGCAGTGACGCTGACGAGGACGATGAGGACCGGG 

GGGTCATGGCCGTCACAGCGGTAACCGCCACAGCTGCCAGCGACAGGATGGAGAGCGACTCA 

GACT CAGACAAG AGTAGCGACAAC AGTGGC CTGAAG AGGAAG ACGC CTG CGCT AAAGATGTC 

GGTCTCGAAACGAGCCCGAAAGGCCTCCAGCGACCTGGATCAGGCCAGCGTGTCCCCATCCG 

AAGAGGAG AACTCGGAAAGCTCAT CTGAGT CGGAGAAGACCAGCGACCAGGACTTCACACCT 

GAGAAGAAAGCAGCGGTCCGGGCGCCACGGAGGGGCCCTCTGGGGGGACGGAAAAAAAAGAA 

GGCGCCGTCAGCCTCCGACTCCGACTCCAAGGCCGATTCGGACGGGGCCAAGCCTGAGCCGG 

TGGCCATGGCGCGGTCGGCGTCCTCCTCCTCCTCTTCCTCCTCCTCCTCCGACTCCGATGTG 

TCTGTGAAGAAGCCTC CGAGGGGCAGGAAGCCAGCGGAGAAGCCTCTC CCGAAGCCGCGAGG 

G CGG AAAC CGAAGC CTGAACGGCCTCCGT C C AGCT C CAGCAGTGAC AG TG ACAG CGACGAGG 

TGGACCG CAT CAGTGAGTGGAAGCGG CGGGACGAGG CGCG GAGGCG CG AG CTGGAGGC C CGG 

CGGCGGCGAGAGCAGGAGGAGGAGCTGCGGCGCCTGCGGGAGCAGGAGAAGGAGGAGAAGGA 

GCGGAGGCGCGAGCGGGCCGACCGCGGGGAGGCTGAGCGGGGCAGCGGCGGCAGCAGCGGGG 

ACGAGCTCAGGGAGGACGATGAGCCCGTCAAGAAGCGGGGACGCAAGGGCCGGGGCCGGGGT 

CCCCCGTCCTCCTCTGACTCCGAG CC CGAGGCCGAGCTGGAGAGAGAGGCCAAGAAATCAGC 

GAAGAAGCCG CAGT CCT CAAGCACAGAG CC CG C CAGGAAACCTGGC CAGAAGGAGAAGAGAG 

TGCGGCCCGAGGAGAAGCAACAAG CCAAGCC CGTGAAGGTGGAGCGGACCCGGAAGCGGTCC 

GAGGGCTTCTCGATGGACAGGAAGGTAGAGAAGAAGAAAGAGCCCTCCGTGGAGGAGAAGCT 

GCAGAAGCTG CACAG TGAGAT CAAGTTTGC CCTAAAGGTCGACAGC CCGG ACGTGAAGAGGT 

GCCT GAATG C CC TAGAGGAG CTGGGAAC CCTGCAGGTGACCTCTCAGAT C CTCCAGAAGAAC 

ACAGACGTGGTGGCCACCTTGAAGAAGATTCGCCGTTACAAAGCGAACAAGGACGTAATGGA 

GAAG GCAGCAGAAGT CTATA CC CGGCTC AAGTCG CGGGT CCTCGGCCCAAAGAT CGAGG CGG 

TGCAGAAAGTGAACAAGGCTGGGATGGAGAAGGAGAAGGCCGAGGAGAAGCTGGCCGGGGAG 

GAGCTGGCCGGGGAGGAGGCCCCCCAGGAGAAGGCGGAGGACAAGCCCAGCACCGATCTCTC 

AG CC CCAG TGAATGGCGAGGC CACATCACAGAAGGGGGAG AGCGCAGAGG ACAAGGAG CACG 

AGGAGGGT CGGG ACTCGGAGGAGGGG CCAAGGTGTGGCTC CTCTGAAGAC CTG CACGACAGC 

GTACGGGAGGGTCCCGACCTGGACAGGCCTGGGAGCGACCGGCAGGAGCGCGAGAGGGCACG 

GGGGGACT CGGAGG CCCTGGACGAGGAGAG CTGAG C CG CG GG CAG CCAGG CC CAGC CC CCGC 

CCGAGCTCAGGCTGCCCCTCTCCTTCCCCGGCTCGCAGGAGAGCAGAGCAGAGAACTGTGGG 

GAACGCTGTGCTGTTTGTATTTGTTCCCTTGGGTTTTTTTTTCCTGCCTAATTTCTGTGATT 

TCCAACCAACATGAAATGACTATAAACGGTTTTTTAATGA 



(VP** 



WO 00/12708 PCT/US99/20111



FIGURE 174 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71286 
xsubunit 1 of 1, 671 aa, 1 stop 
><MW: 74317, pi: 7.61, NX(S/T): 0 

MPHAFKPGDLVFAKMKGYPHWPARIDDIADGAVKPPPNKYPIFFFGTHETAFLGPKDLFPYD 
KCKDKYGKPNKRKGFNEGLWEIQNNPHASYSAPPPVSSSDSEAPEANPADGSDADEDDEDRG 
VMAVTAVTATAASDRMESDSDSDKSSDNSGLKRKTPALKMSVSKRARKASSDLDQASVSPSE 
EENSESSSESEKTSDQDFTPEKKAAVRAPRRGPLGGRKKKKAPSASDSDSKADSDGAKPEPV 
AMARSASSSSSSSSSSDSDVSVKKPPRGRKPAEKPLPKPRGRKPKPERPPSSSSSDSDSDEV 
DRISEWKRRDEARRRELEARRRREQEEELRRLREQEKEEKERRRERADRGEAERGSGGSSGD 
ELREDDEPVKKRGRKGRGRGPPSSSDSEPEAELEREAKKSAKKPQSSSTEPARKfGQKEKRV 
RP E E KQQ AK P VKVE RTRKRS EG F S MDR KVE KKKE P S VE E KLQ KLHS E I KF ALKVDS PD VKRC 

LNALEELGTLQVTSQILQKIJTDWATLKKIRRYKANKDVMEKAAErVYTRLKSR 

Q KVNKAGMEKE KAEE KLAGE ELAG EE APQ E KAED KP S TDLS AP VNGEATS Q KGES AED KEHE 

EGRDSEEGPRCGSSEDLHDSVREGPDLDRPGSDRQERERARGDSEALDEES 

Signal peptide: 

amino acids 1-13 



pc in* 
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FIGURE 175 

GTTGGTTCTCCTCXiATCTTC^CCTTACCAACT 

ACAC CATT TGAAAGAGAACATTGTTTT C AT CA^AATGCTAAT AAAGATQAAAGACTTJUU^G CC^AAG CCAAGA 
TTTTCACCTTTTTC CTGCTTTGATGATG CTAAGCATG AC CATGTTGTTTCTTCCAGTC^CTGGCACTTTGAAGCA 
AAATATTCCAAGACTCAAGCrAACCTACAAAGACTTGCTGCTTTCAAATAGCTGTAT^ 

CTTTCTACTCAGTCTGGTTGACTTAAACAAAAATTTTAAGAAGATTTATTG 

ATTATGTAAATTAGCTGGGAAAG ATG CCAATACAGAATCTGCAAATTTCATCAGAGTACTT C AGCCCTATAACAA 

AACTCACATATATGTGTGTGGAACTGGAGCATTTCATCCAATATGTGGGTATATTGAT 

GGATATTATATTCAAACTAGACACACATAATTTGGAGTCTGGCAGACTGAAATGTCCTTTCGA 

TTTTG C TT C AGTAATGACAG ATGAGT ACCTCTACT CTGG AACAG CTT C TG ATTTC CTTGGCAAAGAT AC TGCATT 

CACTCGATCCCTTCG^CTACTCATC^ 

AGCAAAATTTATTGGAACTTTCTTCAT^^ 

TGAATCATCTCAAGAAGGCAGTACCTCCGATAAAACCATCCTTTCTCGAGTTGGAAGAGTTTGTAAGA^ 
ACXSAGGACAAraCAGCCTGATAAACAAGTGGACGACTTTTCTTAAGGCCAGAOT 

TGATGGGGC^GATACTTACTTTGATGAGCTTCAAGATATTTATTTACTCCCCACAAGAGATGAAAGAA^ 
AGTAT AT GGAG TCTTTACT ACAAC CAG CTC C ATCTTCAAAGGCTC TG CTG T TTGTG TGT AT AGC ATGGCTGACAT 
CAGAGCAGTTTTTAATGGTCCATATGCTCATAAG<3AAAGTGCAGACCATCGTTGGGTGCAGTATGATGGGA 
TCCTTATCCACGGCCTGGTACATGTC CAAG CAAAAC CTATGACCCACTG ATTAAGTCCACCCGAG ATTTTCCAGA 
TGATGTCATCAGTTTCATAAAGCGGCACTCTGTGATGTATAAGTCCGTATACCCAGTTGCAGGAGGACCAACGT^ 
CAAGAGAATCAATGTGGATTACAGACTGACACAGATAGTGGTGGATCATGTCATTGCAGAAGATGGCCAGTACGA 
TGTAATG TTTC1TGGAACAGACATTGGAACTGTCCTCAAAGTTGT CAGCATTTCAAAGGAAAAGTGGAATATGGA 
AGAGGTAGTGCTGGAGGAGTTGCAGATATTCAAGCACTCATCA^^ 

GCAACAATTGTACATTGGTTCCCGAGATGGATTAGTTCAGCTCTCCTTGCACAGATGCGACACTTATG^ 
TTGCGCAGACTGT^GTCTTGCCAGAGACCCCTACTGTGCCTGGGATGGAAATGCA 

TTCTAAAAGGAGAGCTAGACGC CAAGATGTAAAATATGGCGACCCAATCAC CCAGTGCTGGGACATCGAAGACA3 
CATTAGTGATGAAACTGCTGATGAAAAGGTGATTTTTGGCATTGAATTTAACTC^^ 

T AAATC CCAACAAG CAACTATTAAATGG TAT AT C CAGAGGTCAG GGGATGAG CAT C GAGAGGAGTTGAAGC C CGA 
TGAAAGAATCATCAAAACGG AATATGGG C TACTG ATT CGAAGTTTG CAGAAG AAGG ATT CTGG GATGTATTACTG 
CAAAGCCCAGGAGCACACTTTCATCCACACCATAGTGAAGCTGAC^^ 

AAAT AC C C AGAGG GCAGAG CATGAGGAGGGGCAGGTCAAGGATCTATTC^CTGAGTCACGGTTGAGATACAAAGA 

CTAC^TCCAAATCCTTAGCAGCCCIAAACTTCAGCCTCGACCAGTACTGCGAAJCAGATGTGG 

GAG ACAGAGAAACAAGGGGGGCCCAAAGTGGAAGCACATGCAGGAAATGAAGAAGAAACG AAATC 

CAG AGAC CTG GATG AGCTC C CTAG AGCTGT AG C C ACGTA^TTTTC TACTTAATTT AAAG AAAAGAATTC C TTAC C 

TATAAAAACATTGCCTTCTGTTTTGTATATC CCTT ATAGTAATTCATAAATGCTTC CCATGGAGTTTTGCTAAGG 

CACAAGACAATAATCTGAATAAGA C AATATG TGAT G AATAT AAG AAAGGGCAAAAAATTC ATTTGAAC CAGTTTT 

CCAAGAACAAATCTTGCACAAGCAAAGTATAAGAATTATCCTAAAAATAGCGGGTTTA^ 

TCTTTTGAGTTT^C^AATTTATTGTCATGTAAATAGTTGAGCTAAGCAAGCCC 

GCTTTATTCCCTCGAATGTCCATTAAGCATGGAATTTACCATGC^ 

CATTCCTATTGAGAACCAGCTACCTTGTGGTAGGGAATAAGAGGTCAG^CACAAATTAAGACAACT 

AACAGGAACTTTCTCAGTGAGCCATTCACTCCTGGAGAATC^TATAG^ 

TC^CCACTGGGGT^AAATTTAGTGTACTACAACATTGATTTACTC^GG 

ATTGACTAGTC AGGAGT AACAGG TT CACAGAGAGAAGTTGGTGCTTAGTTATGTGTTTTTTAGAGTATATACTAA 
GCTCTACAGGG ACAG AATG C TTAATAAATAC TT TAATAAGATATG GG AAAATATTTTAATAAAACAAGGAAAACA 
TAATGATGTATAATG CATC CTG ATGGGAAG GCATG CAGATGGGATTTGTTAG AAGACAGAAGGAAAGAC AGCCAT 
AAATTCTGGCTTTGGGGAAAACTCATATCCCCATGAAAAG 

TGG AG C T CTTTT CACT AGG G TAT AA GTAG CT G C C AATTTGT AATT C AT C T GT TAAAAAAAAT C TAGATT AT AACA 
AAC TG CTAGC AAAAT CTGAGG AAACATAAATTCTTCTGAAGAATC AT AGGAAGAGTAGACATTTTATTTATAACC 
AATGATATTTCAGTATATATTTTCTCTCTTTTAAAAAATATTTATCATACTC 
CTTTATTCTCTCCTGTATATTGGATTTT'GTGATTATATTTGA 

GAATTAAGAAAATGACATTT CTGGGGAGTGG G GAT ATAT ATTTGTTG AAT AACAGAACGAGTGT AAAATTTT AA C 
AACGGAAAGC^TTAAATTAACTCTTTGACATCTTCACTCAACCTTTTCTCATTCCTGAGTTAATC^ 
GTAGTATTGTTTTTGTAATTTAACAATAAATAAGC CTGCTACATGT 
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FIGURE 176 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA71883 
><subunit 1 of 1, 777 aa, 1 stop 
><MW: 89651, pI: 7.97, NX(S/T): 3 

MNANKDERLKARSQDFHLFPALMMLSMTMLFLPVTGTLKQNIPRLKLTYKDLLLSNSCIPFL 
GS S E GL DFQTLLLD EERGRLLLGAKDH I FLLS L VDLNKNF KK I YWP AAKER VE LCKLAGKD A 
NTECANFIRVLQPYNKTHIYVCGTGAFHPICGYIDLGVYKEDIIFKLDTHNLESGRLKCPFD 
PQQPFASVMTDEYLYSGTASDFLGKDTAFTRSLGPTHDHHYIRTDISEHYt^LNGAKFIGTFF 
IPDTYNPDDDKIYFFFRESSQEGSTSDKTILSRVGRVCKNDVGGQRSLINKWTTFLKARLIC 
S I PGSDGADTYFDELQD I YLLPTRDEROTWYGVFTTTSS I FKGSAVCVYSMAD IRAVFNGP 
YAHKESADHRWQYDGRIPYPRPGTCPSKTYDPLIKSTRDFPDDVISFIKRHSVMYKSVYPV 
AGGPTFKR INVDYRLTQ I WDHVT AEDGQ YDVMFLGTD IGTVLKWS I SKEKWNMEEWLEE 
LQIFKHSSIILNMELSLKQQQLYIGSRDGLVQLSLHRCDTYGKACADCCIiARDPYCAWDGNA 
CSRYAPTSKRRARRQDVKYGDP ITQCWD IEDS ISHETADEKVIFG IEFNSTFLECI PKSQQA 
TIKWYIQRSGDEHREELKPDERIIKTEYGLLIRSLQKKDSGMYYCXAQEHTFIHTIVKLTLN 
VI ENEQMENTQRAEHEEGQ VKDLLAE S RLR YKD Y I Q I L S S PNF S LDQ YCEQMWHRE KRRQRN 
KGGPKWKHMQEMKKKRNRRHHRDLDELPRAVAT 

Important features of the protein: 
Signal peptide: 

amino acids 1-36 

N-glycosylation sites. 

amino acids 139-142, 607-610, 724-727 

Tyrosine kinase phosphorylation site. 

amino acids 571-576 

Gram-positive cocci surface proteins 'anchoring' hexapeptide. 

amino acids 32-37 
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FIGURE 177 

CCCTGACCTCCCTC^CCACACTGAGCT^ 
CAACCTCCCAGGTAAGCTGGGAGCAAGACCTG 

CTCAGCAGTTTCAG CCAGCAGGGACTGATCAGGTGTGTGTC CTGGAGTGGGGAGCAGAAGGCGTGGCTGGCAAGA 

GTGGCCTGGAGAAAGAGGTTCAGCGCTTGACCAGCCGAGCTGCCCGTGACTACAAGATCCAGAACCATG 

GGGTGAGGTGGGGGGGCACAGGTGTCATGTGCACCTTCTTGTCT 

^CAT^GG^ 

AAGGGAGTGACTTAACCTCTCTGGACTTCAATTTCCTCATCACTAAAGTAGGGCGAATA^ 

AGGGAAGATTAAATGACATAATGTATGTGA^GCAACTAGCAAAGTACCAGTCCCATAGTAAGTCATGCCCCACAG 
TATTT C CAC CC AC CC CTGTT CTC TGCCTTC C C AACCAGG T ACTG CAACGACTGGAG CAGAGG CGGCAG CAGGCTT 

CAGAGCGGGAGGCTCCAAGCATAGAACAGAGGTTACAGGAAGTGCGAGAGAGCATCCGCCGGGCACAGGTGAGCC 
AGGTGAAGGGGGCTGCCCGGCTGGCCCTGCTGCAGGGGGCTGGCTTAGATGTGGAGCGCTGGCTGAAG 
TGACCCAGGCCCAGGATGAGGTGGAGCAGGAGCGGCGGCTCAGTGAGGCTCGGCTGTCCCAGAGGGACCTCTCTC 
CAACCGCTGAGGATGCTGAGCTTTCTGACTTTGAGGAATGTGAGGAGACGGGAGAGCTCTTTGAGGAGCCTGCCC 
CC CAAGCCCTGG CCACGAGGGCC CTC CCCTGCCCTG CACACGTGGTATTTCGCT ATCAGGCAGGGCGTGAGGATG 

AGCTGACAATCACGGAGGGTGAGTGGCTGGAGGTCATAGAGGAGGGAGATGCTGACGAATGGGTCAAGGCTCGGA 
ACCAGCACGGCG^GGTAGGCTTTGTCCCT^^ 

AAGACAGTGACAATCCCTGCGGGGCAGAGCCCACAG CATTCCTGGCACAGGCCCTGTACAGCTACAC CGGACAGA 

gtgcagagc^gctgagcttccctgagggggcactcatccgtctgctgccccgggcccaagatggag™ 

GCTTCTGGAGGGGAGAATTTGGGGGCCGTGTTGGGGTCT^ 



CTACCTCTGTGTTGGATGGGCCCCCTGCACCTGTCCT 

ACATGATGGCACCTCGACTCAGGCCGATGCGTCCACCACCTCCCCCGCCGGCTAAAGCCCCGGATCCTC 

C^GATCCCCTCACCTGAAGGCCAGGGAAGCCTTGACCCCCAGTGATGCTGOTGTCCCTATOT 

CCACACCATCAATGATCCAGAGCAACACAGCCAAAAGCTGGAATCGCCC 

GGAAACTTGCCCCTTCCCATTTCTAGAGCTGGAACCCACTCCTTTTTTTCCC^ 

GGAACTACTACCTTCTCTTCTGTCATGACCCTATCTAGGGTGGTGAAATGCCTGAAATCT 

ATCCATCAAGGTCTCTAGTAGTTCTGGCCCAC CTCTTTCCCCACCCTGGCTC CATGACCCACCCCACTCTGGATG 

CCAGGGTCACTGGGGTTGGGCTGGGGAGAGGAACAGGCCTTGGGAATCAGGAGCTGGA^ 

CTGTAATGGTCTX3AGCGGATTTATTGACAATGAATA 

CTAAGAGGGCAGGGGGCCTACGGTGCTATTGCTTTAGGGGCCCACCACGGGCAGGGGCCT^ 

GCTCTATCATATGGAGCGAGGTGTTGGGGAAGGCGGGGCAGGCAGCCTGTTGCAGGCAGGGGAAGGAG 

TGAGGGGCTGTGACCTCTCCTGAGGCCCCCAGCCTGAGACTGTGCAACTCCAGGTGGAAGTAGA^ 

AGCTGGGGGGCAGTGCTGTCCAGTGGAGGGGAGGGCTTTCACGCCCACCCACCCCCTGGCCCTGCCAGCTGGT^ 

TCCATCAGCACAATGAAGGAGAOTGGAGAAGAGGAAGAATAACACTGTTC 

TTTTCCCCTCSGGGCTCCAGGACCTTCCCTACCTCCACCACC^CCAAG^ 

AGTTTACTCTGGGGGTTC^GGGAGCCGAAAGGCITAAATAGTTTAAGTAGGTGATC 

TTTAGGGCTCAGGCAGACT CACCTC ACATACTC CCTGCTCC CTGTGGTAGAGACACCTGAGAGAAAGGGGAGGGG 

TCAACAATGAGAGACCAGGAGT AGGTC CTATCAGTGCCCC CCAGAGTAGAGAGCAATAAGAGCCCAGCCCAGTGC 

AGTCCCGGCTGTGTTTTCCTACCTCGTGATCAGAAGTGTCTGGTTTGCTTGGCTGCCC^ 

GCAGCCCTGGGCTTGGGCCCCTCCCTCCGGCCCTCAGTGTTGGCTCTGCAGAAOT 

CACGAGGGGTTAGGCTGCTGTCCCTGAGTCCTCCATTCTGTACT 

TCTCAGGGGG<^CrCTCCATGGCAGG<^TCCCrrGCCTTG^ 



TCTCAATGTGTGTCACCCGG AACC TG GG AGGGGAGGGAACACTGGGGTTTAGGACCACAACTCAGAGGCTGCTTG 
GCCCTCCCC TCTGACCAGGGACATC CTGAGTTTGGTGGCTACTTCCCTCTGGCCTAAGGTAGGGGAGGCCTTCTC 
AGATTGTGGGGCACATTGTGTAGCCTGACTTCTGCTGGAGCTCCCAGTCCAGGAGGAAAGAGCCAAGGCCCACT 
TTGGGATCAGGTGCCTGATCACTGGGCCCCCTACCTCAGCCCCCCTTTCCCTGGAGCACCT 
CAGAGAACACAGTGGTCTCCCCTGTCCGGGGGCGGCTTTTTCCTTCCT 

GCCTCTTGCTGCGGCTGCAATGGATGCAAGGGGCTGCAGAGCCCAGGTGCACTGTGTGATGATGGGA 

CGTCCTGCAGGCTGGAGGTGGCATCCACACTGGACAGCAGGAGGAGGGGAGTGAGGGTAACATTTCC^ 

TCATGTTTTGTTTCTTACGTTCT^ 

TTTCTTGTCTTTATC TAATAAAC TCAAT ATTAAG 



'27D 
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FIGURE 178 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73401 
><subunit 1 of 1, 370 aa, 1 stop 
><MW: 40685, pI: 4.53, NX(S/T): 0 

MQLAKYQSHSKSCPWFPPTPVLCLPNQVLQRLEQRRQQASEREAPSIEQRLQEVRESIRRA 
QVSQVKGAARLALLQGAGLDVERWLKPAMTQAQDEVEQERRIiSEARLSQRDLSPTAEDAELS 
DFEECEETGELFEEPAPQALATRALPCPAHWFRYQAGREDELTITEGEWLEVIEEGDADEW 
VKARNQHGEVGFVPERYLNFPDLSLPESSQDSDNPCGAEPTAFLAQALYSYTGQSAEELSFP 
EG AL I RLL PRAQDG VDDG FWRGE FGGR VGVF P S LL VE ELLG PPGPPELSD PEQM LPSPSPPS 
FSPPAPTSVLDGPPAPVLPGDKALDFPGFLDMMAPRLRPMRPPPPPPAKAPDPGHPDPLT 
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FIGURE 179 A 

CACAGG GAGAC C CA.CAGACACAT ATGCACGAGAGAG ACAGAGG AG GAAAGAGACAGAGACAAAGGC AC AG CG GAA 
GAAGGCAGAGACAG GG CAG GCAC AG AAGCGG CCCAGACAG AG TC C TA C AGAGG GAGAGG C CAGAG AAG CTG CAGA 

AGACACAGGCAGGGAGAGACAAAGATCCAGGAAAGGAGGGCTCAGGAGGAGAGTTTGGAGAAGCCAGACCCCTC 

GCACCTCTCCCAAGCCCAAGGACrAAGTTTTCTCCATTTC 

TCTGACCTTGGCAGGAGTCCAAGCCCCCAGGCTACAGAGAGGAGCTTT 

GCCCTAGACGGGCTCAGTCC CTCCCAGCTGCAGTACCAGTGCCATGTC CCAGACAGG CT CGCATCCCGGGAGGGG 
CTTGGCAGGGCGCTGGCTGTGGGGAGCCCAACCCTGCCTCCTGCTCCCCATTGTGCCGCTCTCCTGGCTGGTGTC 
GCTGCTTCTGCTACTGCTCMCCTCTCTCCTGCCCTCAGCCCGGCTGGCCAGCCC 

CGTGTTTCCAGAGAAGCTCAACGGCAGCGTCCTGCCTGGCTCGGGCGCCCCTGCCAGGCTGTTGTGCCGCTTGCA 
GGCCTTTGGGGAGACGCTGCTACTAGAGCTGGAGCAGGACTCCGGTGTGCAGGTCGAGGGGCTGACAGTGCAGTA 
CCTGGGCCAGGCGCCTGAGCTGCTGGGTGGAGGAGAGCCTGGQACCTACCTGACTGG 

GGAGTCGGTGGCATCTCTGCACTGGGATGGGGGAGCCCTGTTAGGCGTGTTACAATATCGGGGGGCTGAACTCCA 

CCTCCAGCCCCTGGAGGGAGGCACCCCTAACTCTGCTGGGGGACCTGGGGCTCACATCCTACGCCGGAAGAGTCC 

TGCCAGCGGTCAAGGTCCCATGTGCAACGTCAAGGCTCCTCTTGGAAGCCCCAGCCCCAGACCCCGAAGAGCCAA 

GCGCTTTGCTTCACTGAGTAGATTTGTGGAGACACTGGTGGTGGCAGATGACAAGATGGCCGCATTCCACGGTGC 

GGGGCTAAAGCGCTACCTGOTAACAGTGATGGCAGCAGCAGCCAAGGCCTTCAAGCACCCAAGCATCCGCAATCC 

TGTCAGCTTGGTGGTGACTCGGCTAGTGATCCTGGGGTCAGGCGAGGAGGGGCCCCAAGTGGGGCCCAGTGCTGC 

CCAGACCCTGCGCAGCTTCTGTGCCTGGCAGCGGGGCCTCAACACCCCTGAGGACTCGGGCCCTGACCACTTTGA 

CACAGCCATTCTGTTT AC CC GTCAGGACCTGTGTGGAGTCTC CACTTGCGACACG CTGGGTATGGCTGATGTGGG 

CACCGTCTGTGACCCGGCTCGGAGCTGTGCCATTGTGGAGGATGATGGGCTCCAGTCAGCCTTCACTGCTGCTCA 

TGAACTGGGTCATGTCTTCAACATGCTCCATGACAACTCCAAGCCATGCATCAGTTTGAATGG 

CTCTCGCCATGTCATGG CC C CTGTG ATGGCTCATGTGGATC CTGAGGAGCCCTGGTCCCCCTGCAGTGCC^ 

CATCACTGACTTCCTGGACAATGGCTATGGGCACTGTCTCTTAGACAA 

GACTTTC CCTGGCAAGGAC TATGATGCTGACCGCCAGTGCCAGCTGACCTTCGGGCCCGACTCACGC CATTGTCC 
ACAGCTGCCGCCGCCCTGTGCTGCCCTCTGG^ 

CTCGCCCTGGGCCGATGGCACACCCTGCGGGCCCGCACAGGCCTGCATGGGTGGTCGCTGCCTCCACATGGACC^ 
GCTCCAGGACTTCAATATTCCACAGGOTGGTGGCTGGGGTCCTTGGGGACCATGGG 

TGGGGGTGGTGTCCAGTTCTCCTCCCGAGACTGCACGAGGCCTGTCCCCCGGAATGGTGGCAAGTACTGTGA 

CCGCCGTACCCGCTTCCGCTCCTGCAACRCTGAGGACTGCCCAACTGGCTCAGCCCrGACOT 

GTGTGCTGCCTACAACCACCGCACCGACCTCTTCAAGAGCT 

AGGCGTGGCCCCCCAGGACCAGTGCAAACTC^CCTGCCAGGCCCGGGCACTGGGCTACTACTATGTGCTGGAGCC 

ACGGGTGGTAGATGGGACCCCCTGTTCCCCGGACAGCTCCTCGGTCTGTGTCCAGGGCCGATGCATCCATGCTGG 

CTGTGATCGCATCATTGGCTTCCAAGAAGAAGTTTGACAAGTGCATGGTGTGCGGAGGGGACGGTTCT 

CAAGCAGTCAGGCTCCTTCAGGAAATTCAGGTACGGATACAACAATGTGGTCACT ATC CCCGCGGGGG CCACCCA 

CATTCTTGTCCGGCAGCAGGGAAACCCTGGCCACCGGAGCATCTACTTGGCCCTGAAGCTGCCAGATG 

^GCCCTCAATGGTGAATACACGCTGATGCCCTCCCCC^CAGATGT 

CAGCGGGGCCACTGCAGCCTCAGAGACACTGTCAGGCCATGGGCCACTGGCCCAGCCT 

AGTGGCTGGCAACCCCCAGGACACACGCCTCCGATACAGCTTCTTCGTGCCCCGGCCGACCCCT 

CCCCACTCCCCAGGACTGGCTGCACCGAAGAGCACAGATTCTGGAGATCCTTCGGCGGra 

GAAA^CCTCACTATCCCGGCTGCCCTTTCTGC^CACCGGGGCCTCGGACTTAGCTGGGAGAAA 

CTGTTGCTGCCTCATGCTAAGACrCAGTGGGGAGGGGCro 

GCGCAGGCTGGCCCTGC C CTGGTTTCCTGCCCTGGGAGGCAGTGATGGGTTAGTGGATGGAAGGGGCTGACAG AC 
AGCCCTCCATCTAAACTGCCCCCTCTG^^ 

CAGTTGTATTTATTTAGTATTTATTCACTTTTATTTAGCACCAGGGAAGGGGACAAGGA 

CCTGACCCCTGACCCCTCATAGCCCTCACCCTGGGGCTAGGAAATCCAGGGl^^TGGTGATAGGTATA 

TGTGTATGCGTGTGTGTGTGTGTGTGAAAATGTGTGTGTGCTTATGTATGAGGTACAACCTGTTCTGCTTTCCTC 
TTCCTGAATTTTATTTTTTGGGAAAAGAAAA 

TITTTTTTTCTTTCTTTCTTTCTTTTTTTTTTTTGAGA^ 

GCAa^TCTCGGCTCACTGCATCCTCCGCCTCCCGGGTTCAAGTGATTCTC!ATGCCTC^ 

GGATTACAGGCTCCTGCCACCACGCCCAGCTAATTTTTGTTTTGTTTTGTTTGGAGACAGAGT 

ACCAGGGCTGGAATGATTTCAGCTCACTGCAACCTTCGCC^CCTGGGTTCCAGCAATTCTCOTG^ 

CGAGTAGCTG AGATTAT AGGCACCTAC CACCACGCC CGGCTA\ATTTTTGTATTTTTAQTAGAGACGGGGTTTCAC 

CATGTTGGCCAGGCnKSTCTCGAACTCCTGACCTTAGGTGATCCACTCGCCTTCATCTC 

ACAGGCGTGAGCCACCGTGGCTGGCCACGCCCAACTAATTTTTGTATTTTTAGTAGA 

TGGCCAGGCTGCTCTTG AACTC CTGAC CTCAGG1AATCGAC CTGCCTCGGCCTCXZCAAAGTGCTGGGATTACAGG 
TCn-GAGCCACCACGCCCGGTACATATrTTTTAAATTGAATTCTACTATTTATGTGATCCT 
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FIGURE 179B 

ATGTGGTTGCATCCTAACTCCATGTCTCTGAGCA 

TTTGTTGTGAGGATT AAATAATGT AAATAAAG AACT AG CATAACACTCAAAAAAAAAAAAAAAAAAAAAAAAAAA 
AAAAAAAAA AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 180 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73492 
><subunit 1 of 1, 837 aa, 1 stop 
><MW: 90167, pI: 8.39, NX(S/T): 1 

MSQTGSHPGRGIAGRWLWGAQPCLLLPIVPLSWLVWLLLLLLASLLPSARLASPLPREEEIV 

FPEKLNGSVLPGSGAPARLLCRLQAFGETLLLELEQDSGVQVEGLTVQYLGQAPELLGGAEP 

GTYLTGTINGDPESVASLHWDGGALLGVLQYRGAELHLQPLEGGTPNSAGGPGAHILRRKSP 

ASGQGPMCNVKAPLGSPSPRPRRAKRFASLSRFVETLWADDKJ4AAFHGAGL 

AAKAFKHPS I RNPVSLWTRLVI LGSGEEGPQVGPS AAQTLRS FCAWQRGLNTPEDSGPDHF 

DTAILFTRQDLCGVSTCDTLGMADVGTVCDPARSCAIVEDDGLQSAFTAAHELGHVFNMLHD 

NS KP C I S LNG PL S T S RHVMAP VMAHVD P EE PWS P CS ARF I TD F LDNG YGHCLLD KP E APLHL 

PVTFPGKDYDADRQCQLTFGPDSRHCPQLPPPCAALWCSGHLNGHAMCQTKHSPWADGTPCG 

PAQACMGGRCLHMDQLQDFNIPQAGGWGPWGPWGDCSRTCGGGVQFSSRDCTRPVPRNGGKY 

CEGRRTRFRSCNTEDCPTGSALTFREEQCAAYNHRTDLFKSFPGPMDWVPRYTGVAPQDQCK 

LTCQARALGYYYVLEPRVVDGTPCSPDSSSVCVQGRCIHAGCDRIIGSKKKFDKCMVCGGDG 

SGCSKQSGSFRKFRYGYNNWTIPAGATHILVRQQGNPGHRSIYLALKLPDGSYALNGEYTL 

MPSPTDWLPGAVSLRYSGATAASETLSGHGPLAQPLTLQVLVAGNPQDTRLRYSFFVPRPT 

PSTPRPTPQDWXiHRRAQILEILRRRPWAGRK 

Important features of the protein: 

Signal peptide: 

amino acids 1-48 

N-glycosylation site. 

amino acids 68-71 

Glycosaminoglycan attachment site 

amino acids 188-191, 772-775 

cAMP- and cGMP-dependent protein kinase phosphorylation site. 

amino acids 182-185 

Tyrosine kinase phosphorylation site. 
amino acids 730-736 
N-myristoylation sites. 

amino acids 5-10, 19-24, 121-126, 125-130, 130-135, 147-152, 167- 

172, 168-173, 174-179, 323-328, 352-357, 539-544, 555-560, 577- 

582, 679-684, 682-687, 763-768 

Amidation sites. 

amino acids 560-563, 834-837 

Leucine zipper pattern. 

amino acids 17-38, 24-45 

Neutral zinc metallopeptidases, zinc-binding region signature. 

amino acids 358-367 
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FIGURE 181 

CAGCAGTGGTCTCTCAGTCCTCTCAAAGCAAGGAAAGAGTACTGTGTGCTGAGAGACCAIOG 
C AAAGAAT C C T C C AG AG AAT TGTGAAG ACT GT CA C ATT CT AAAT G C AG AAG CTTTT AAAT C C 
AAGAAAATATGTAAATCACTTAAGATTTGTGGACTGGTGTTTGGTATCCTGGCCCTAACTCT 
AATTGTCCTGTTTTGGGGGAGCAAGCACTTCTGGCCGGAGGTACCCAAAAAAGCCTATGACA 
TGGAG CACACTTTCTACAGC AATGGAGAGAAG AAGAAG ATTT AC ATGGAAAT TG ATCCTGTG 
AC CAGAACTGAAAT AT TCAGAAG C GG AAAT GG CACTGATGAAACATTGGAAGTGCACGACTT 
TAAAAACGGATACACTGG CATCTACT TCGTGGGT CTT CAAAAATGTTTTAT C AAAACT CAGA 
TTAAAGTGATTCCTGAATTTTCTGAACCAGAAGAGGAAATAGATGAGAATGAAGAAATTACC 
ACAACTTT CTTTGAACAGTCAGTGAT TTGGGT CCCAGCAGAAAAGCCTATTGAAAACCGAGA 
TTTTCTTAAAAATTCCAAAATTCTGGAGATTTGTGATAACGTGACCATGTATTGGATCAATC 
CCACT CTAATAT CAGTTT CTGAGTTACAAGACTTTG AGGAGGAGGGAGAAGAT C TT CACTTT 
CCTGCCAACGAAAAAAAAGGGATTGAACAAAATGAACAGTGGGTGGTCCCTCAAGTGAAAGT 
AGAGAAGACCCGTCACGCCAGACAAGCAAGTGAGGAAGAACTTCCAATAAATGACTATACTG 
AAAATGGAATAGAATTTGATCCCATGCTGGATGAGAGAGGTTATTGTTGTATTTACTGCCGT 
CGAGGCAACCGCTATTGCCGCCGCGTCTGTGAACCTTTACTAGGCTACTACCCATATCCATA 
CTGCTACCAAGGAGGACGAGTCATCTGTCGTGTCATCATGCCTTGTAACTGGTGGGTGGCCC 
GCATGCTGGGGAGGGTCTAATAGGAGGTTTGAGCTCAAATGCTTAAACTGCTGGCAACATAT 
AATAAATG CATG CT ATTCAATG AATTTCTGCCTATGAGG CATCT GG C C C CTGGTAG CCAGCT 
CTCCAGAATTACTTGTAGGTAATTCCTCTCTTCATGTTCTAATAAACTTCTACATTATCACC 
AAAAAAAAAAAAAAAAAAA 



WO 00/12708 



PCT/US99/20111 



FIGURE 182 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73727 
><subunit 1 of 1, 317 aa, 1 stop 
><MW: 37130, pI: 5.18, NX(S/T): 3 

MAKNP PENCE DCH I LNAEAF KS KK I C KS LK I C GL V FG I LALTL I VL FWGS KHFWPEVPKKAY 
DMEHT F YSNGEK KK I YME I D P VTRTE I F RS GNGTD E TLE VHD F KNG YTG I Y FVGLQKCF I KT 
QIKVIPEFSEPEEEIDENEEITTTFFEQSVIWPAEKPIENRDFLKNSKILEICDNVTMYWI . 
NP TL I S VS ELQD FEEEGEDLHF PANE KKGI EQNEQWWPQ VKVEKTRHARQASEEELP IND Y 
TENGIEFDPMLDERGYCCIYCRRGNRYCRRVCEPLLGYYPYPYCYQGGRVICRVIMPCNWWV 
ARMLGRV 

Important features of the protein: 
Signal peptide: 

amino acids 1-40 

Transmembrane domain: 

amino acids 25-47 (type II) 

N-glycosylation sites. 

amino acids 94-97, 180-183 

Glycosaminoglycan attachment sites. 

amino acids 92-95, 70-73, 85-88, 133-136, 148-151, 192-195, 239- 
242 

N-myristoylation sites. 

amino acids 33-38, 95-100, 116-121, 215-220, 272-277 

Microbodies C-terminal targeting signal. 

amino acids 315-317 

Cytochrome c family heme-binding site signature. 

amino acids 9-14 
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FIGURE 183 

GCGGAACTGGCTCCGGCTGGCACCTGAGGAGCGGCGTGACCCCGAGGGCCCAGGGAGCTGCC 
CGGCTGGCCTAGGCAGGCAGCCGCACC^ISGCCAGCACGGCCGTGCAGCTTCTGGGCTTCCT 
GCTCAGCTTCCTGGGCATGGTGGGCACGTTGATCACCACCATCCTGCCGCACTGGCGGAGGA 
CAGCGCACGTGGGCACCAACATCCTCACGGCCGTGTCCTACCTGAAAGGGCTCTGGATGGAG 
TGTGTGTGGCACAGCACAGGCATCTACCAGTGCCAGATCTACCGATCCCTGCTGGCGCTGCC 
CCAAGACCTCCAGGCTGCCCGCGCCCTCATGGTCATCTCCTGCCTGCTCTCGGGCATAGCCT 
GCGCCTGCGCCGTCATCGGGATGAAGTGCACGCGCTGCGCCAAGGGCACACCCGCCAAGACC 
ACCTTTGCCATCCTCGGCGGCACCCTCTTCATCCTGGCCGGGCTCCTGTGCATGGTGGCCGT 
CTCCTGGACCACCAACGACGTGGTGCAGAACTTCTACAACCCGCTGCTGCCCAGCGGCATGA 
AGTTTGAGATTGGCCAGGCCCTGTACCTGGGCTTCATCTCCTCGTCCCTCTCGCTCATTGGT 
GGCACCCTGCTTTGCCTGTCCTGCCAGGACGAGGCACCCTACAGGCCCTACCAGGCCCCGCC 
CAGGGCCACCACGACCACTGCAAACACCGCACCTGCCTACCAGCCACCAGCTGCCTACAAAG 
ACAATCGGGCCCCCT CAGTGACCTCGGCCACG CACAGCGGGT ACAGGCTGAACGACTACGTG 
IG&GT CCCCACAGCCTGCTT CTCCCCTGGGCTGC TGTGGGCT GGGT CC CCGGCGGG ACTGTC 
AATGGAGGCAGGGGTTCC^GCACAAAGTTTACTTCTGGGC^TTTTTGTATCCAAGGAAATA 
ATGTGAATGCGAGGAAATGTCTTTAGAG CACAGGGACAGAGG GGGAAATAAG AGGAGGAGAA 
AGCTCTCTATACCAAAGACTGAAAAAAAAAATCCTGTCTGTTTTTGTATTTATTATATATAT 
TTATGTGGGTGATTTGATAACAAGTT TAAT AT AAAGTGACTT GG GAGTTTGGTCAGTGGGGT 
TGGTTTGTGATCCAGGAATAAACCTTGCGGATGTGGCTGTTTATGAAAAAAAAAAAAA 
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FIGURE 184 



MASTAVQLLGFLLSFLGMVGTLITTILPHWRRTAHVGTNILTAVSYLKGLWMECVWHSTGIY 
QCQI YRSLLALPQDLQAARALMVI SCLLSG IACACAVI GMKCTRCAKGTPAKTTFAILGGTL 
FIIAGLLC1WAVSWTTNDWQNFYNPLLFSGMKFEIGQALYLGFISSSLSLIGGTLLCLSCQ 
DEAPYRPYQAPPRATTTTANTAPAYQPPAAYKDNRAPSVTSATHSGYRLNDYV 

Important features of the protein: 
Signal peptide: 

amino acids 1-21 

Transmembrane domains: 

amino acids 82-103, 115-141, 160-182 
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FIGURE 185 

GAGCTC CCCT CAGGAG CGCGTT AG CTT C AC AC CT T CGG CAGCAGGAGGG CGG CAGCTTCT CG 

CAGGCG GCAGGGCGGGCGGCCAGGATCATSTCCACCACCACATG CCAAGTGGTGGCGTTCCT 

CCTGTCCATCCTGGGGCTGGCCGGCTGCATCGCGGCCACCGGGATGGACATGTGGAGCACCC 

AGGACCTGTACGACAACCCCGTCACCTCCGTGTTCCAGTACGAAGGGCTCTGGAGGAGCTGC 

GTGAGGCAGAGTTCAGGCTTCACCGAATGCAGGCCCTATTTCACCATCCTGGGACTTCCAGC 

CATGCTGCAGGCAGTGCGAGCCCTGATGATCGTAGGCATCGTCCTGGGTGCCATTGGCCTCC 

TGGTATCCATCTTTGCCCTGAAATGCATCCGCATTGGCAGCATGGAGGACTCTGCCAAAGCC 

AACATGACACTGAC CT C C GGGATC ATGTTCATTGT CTC AGGT CTTT GTGCAATTGCTGGAGT 

GTCTGTGTTTGCCAACATGCTGGTGACTAACTTCTGGATGTCCACA.GCrAACATGTACACCG 

GCATGGGTGGGATGGTGCAGACTGTTCAGACCAGGTACACATTTGGTGCGGCTCTGTTCGTG 

GGCTGGGTCGCTGGAGGCCTCACACTAATTGGGGGTGTGATGATGTGCATCGCCTGCCGGGG 

CCTGGCACCAGAAGAAACCAACTACAAAGCCGTTTCTTATCATGCCT^ 

CCTACAAGCCTGGAGGCTTCAAGGCCAGCACTGGCTTTGGGTCCAACACCAAAAACAAGAAG 

ATAT ACGATGGAGGTG CC CG CACAGAGGACGAGGTACAATCTTATC CTTC CAAG CACGACTA 

TGTGTAATGCTCTAAGACCTCTCAGCACGGGCGGAAGAAACTCCCGGAGAGCTCACCCAAAA 

AACAAGGAGAT C CCAT CT AGATTT CTTCTTGCTTTTGACTCACAGCTGGAAGTTAGAAAAG C 

CT CGATTT CATCTTTGGAGAGGCCAAAT GGTCTT AG C CTCAGTCTCTGTC TC TAAATATTC C 

ACCATAAAACAGCTGAGTTATTTATGAATTAGAGGCTATAGCTCACATTTTCAATCCTCTAT 

TT CTTTTT TT AAATATAACTTTCTACT CTGATGAGAGAAT GTGGTTTT AATCTCTCT CTCAC 

ATTTTGATGATTTAGACAGACTCCCCCTCTTCCTCCTAGTCAATAAACCCATTGATGATCTA 

TTTCCCAGCTTATCCCCAAGAAAACTTTTGAAAGGAAAGAGTAGACCCAAAGATGTTATTTT 

CTGCTGTTTGAATTTTGTCTCCCCACCCCCAACTTGGCTAGTAATAAACACTTACTGAAGAA 

GAAGCAATAAGAGAAAGATATTTGTAAT CTCT CC AG CC CATG AT CT CGGTTTTC TT ACACTG 

TGATCTTAAAAGTTACCAAACCAAAGTCATTTTCAGTTTGAGGCAACCAAACCTTTCTACTG 

CTGTTGACAT CTTCTTATT ACAGCAACA CCATTCTAGGAGTTT C CTGAGCT CTC CACTGGAG 

TTAAGT C C TAAATATAGTTAAAAT AAAT AATGTTTTAGTAAAATGATACACTAT CTCTGTGA 
AATAGC CT CAC C CCTA CATGTGGATAGAAGGAAATGAAAAAATAATTGCTTTGACATTGT CT 
ATATGGTACTTTGTAAAGTCATGCTTAAGTACAAATTCCATGAAAAGCTCACACCTGTAATC 
CTAG CACTTTGGGAGG CTGAGGAGGAAGGATCACTTGAGC CCAG AAGTTCGAGACTAGCCTG 
GG CAACATGGAG AAGC C CTGTCTC TACAAAATACAGAGAGAAAAAATCAGC CAGTCATGGTG 
GCATACACCTGTAGTCCCAGCATTCCGGGAGGCTGAGGTGGGAGGATCACTTGAGCCCAGGG 
AGGT TGGGGC TG CAGTGAGC CATGAT CACAC CACTGCACT CCAGCCAGGTGACATAGCGAGA 
TC CT GT CT AAAAAAAT AAAAAAT AAAT AATGGAACACAG C AAGT C C T AGG AAGTAGG T T AAA 
ACTAATT CTTTAA 
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FIGURE 186 



></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73734 
><subunit 1 of 1, 261 aa, 1 stop 
><MW: 27856, pI: 8.50, NX(S/T): 1 

MSTTTCQWAFLLSILGLAGCIAATGMDMWSTQDLYDNPVTSVFQYEGLWRSCVRQSSGFTE 
CRPYFTILGL PAMLQAVRALM I VG I VLGAI GLLVS I FALKCIRI GSMEDSAKANMTLTSG IM 
FIVSGLCAIAGVSVFAmLVTNFWMSTANMYTGMGGWQTVQTRYTFGAALFVGWVAGGLTL 
IGGVMMCIACRGLAPEETNYKAVSYHASGHSVAYKPGGFKASTGFGSNTKNKKIYDGGARTE 
DEVQS YPS KHDYV 

Signal peptide: 

amino acids 1-23 

Transmembrane domains: 

amino acids 81-100, 121-141, 173-194 
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FIGURE 187 

GGAAAAACTGTTCTCOTCTGTGG 

GAGTCC AGCTGGCTAAAACT CAT CC CAGAGG ATA£I£GCAACC CATG CCTT AGAAAT CG CTG 
GGCTGTTTCTTGGTGGTGTTGGAATGGTGGGCACAGTGGCTGTCACTGTCATGCCTCAGTGG 
AGAGTGTCGGCCTTCATTGAAAACAACATCGTGGTTTTTGAAAACTTCTGGGAAGGACTGTG 
G ATGAATTGCGTGAGGCAGGCT AACATCAG GATG CAGTGCAAAATCTATGATTC C CTGCTGG 
CTCTTTCTCCGGACCTACAGGCAGCCAGAGGACTGATGTGTGCTGCTTCCGTGATGTCCTTC 
TTGGCTTTCATGATGGCCATCCTTGGCATGAAATGCACCAGGTGCACGGGGGACAATGAGAA 
GGTGAAGGCTCACATTCTGCTGACGGCTGGAATCATCTTCATCATCACGGGCATGGTGGTGC 
TCAT CC CT GTGAGCTGGGTT GC CAATGC CATCAT CAGAGATTT CTAT AACTCAATAGTGAAT 
GTTGCCCAAAAACGTGAGCTTGGAGAAGCTCTCTACTTAGGATGGACCACGGCACTGGTGCT 
GATTGTTGGAGGAGCTCTGTTCTGCTGCGTTTTTTGTTGCAACGAAAAGAGCAGTAGCTACA 
GATACTCGATACCTTCCCATCGCACAACCCAAAAAAGTTATCACACCGGAAAGAAGTCACCG 
AGCGT CTACT CCAGAAGT CAGTATGTGTAGTTGTGT AT GTTTTTT TAACTTTACTATAAAGC 
CATG CAAATG ACAAAAAT CTAT ATTACTTT CTCAAAATGGACCCCAAAGAAACT TT GATTTA 
CTGTTCTTAACT GC CTAATCTT AATT ACAGGAACTGTGCAT CAGCTATTT AT GATT CTATAA 
GCTATTTCAGCAGAATGAGATATTAAACCCAATGCTTTGATTGTTCTAGAAAGTATAGTAAT 
TTGTTTTCTAAG GTGGTT CAAGCATCTACTCTTTTTATCATTTACT T C AAAATGACATTGCT 
AAAGACTGCATTATTTTACTACTGTAATTTCTCCACGACATAGCATTATGTACATAGATGAG 
TGTAACATTTATATCTCACATAGAGACATGCTTATATGGTTTTATTTAAAATGAAATGCCAG 
TC CATT ACACT GAATAAATAGAACTCAACTATTGCTTTTCAGGG AAAT CATGGATAGGGTTG 
AAGAAGGTTACTATTAATTGTTTAAAAACAGCTTAGGGATTAATGTCCTCCATTTATAATGA 
AGATTAAAATGAAGGCTTTAAT CAG CATTGTAAAGGAAAT TGAATGGCTTTCTGAT ATGCTG 

TTCTTGTGTATTAAATTAACATTTTTAAAACGCAGATATTTTGTCAAGGGGCTTTGCATTCA 
AACTGCTTTTCCAGGGCTATACTCAGAAGAAAGATAAAAGTGTGATCTAAGAAAAAGTGATG 

GAAATCATATATGTATGGATATATTTTAATAAGTATTTGAGTACAGACTTTGAGGTTTCATC 
AATATAAATAAAAGAGCAGAAAAATATGTCTTGGTTTTCATTTGCTTACCAAAAAAACAACA 
ACAAAAAAAGTTGT CCTTTG AG AACTT C AC CT GCT CC TATGTGGGT ACCTGAGTCAAAATTG 
TCATTTTTGTTCTGTGAAAAATAAATTTCCTTCTTGTACCATTTCTGTTTAGTTTTACTAAA 
ATCTGTAAAT ACTG TATTTT TCTGTTTATT CCAAATTTGATGAAACTGACAATC CAATTTGA 
AAGTTTGT GT CG ACGTCTGT CTAGCTTAAATGAATGTGTTC TATTT G CTTTATACATTTATA 
TTAATAAATTGTACATTTTT CTAATT 



WO 00/12708 
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FIGURE 188 



></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73735 
><subunit 1 of 1, 225 aa, 1 stop 
><MW: 24845, pI: 9.07, NX(S/T): 0 



MATHALE I AGLFLGGVGMVGTVAVTVMPQWRVS AF I ENN I WFENFWEGLWMNCVRQANIRM 
QCTIYDSLLALSPDLQAARGIMO^VMSFLAFMM^ 

IFI ITGMWLIPVSWVANAI IRDFYNSIVNVAQKRELGEALYLGWTTALVLIVGGALFCCVF 
CCNEKSSSYRYS I PSHRTTQKS YHTGKKSPSVYSRSQYV 

Signal peptide: 

amino acids 1-17 

Transmembrane domains: 

amino acids 82-101, 118-145, 164-188 




WO 00/12708 



PCT/US99/20111 



FIGURE 189 

TCGCCATGGCCTCTGCCGGAATGCAGATCCTGGGAGTCGTCCTGACACTGCTGGGCTGGGTG 
AATGGCC7TGGTCTCCTGTGCCCTGCCCATGTGGAAGGTGACCGCTTTCATCGGCAACAGCAT 
CGTGGTGGCCCAGGTGGTGTGGGAGGGCCTGTGGATGTCCTGCGTGGTGCAGAGCACCGGCC 
AGATGCAGTGCAAGGTGTACGACTCACTGCTGGCGCTGCCACAGGACCTGCAGGCTGCACGT 
GCCCTCTGTGTCATCGCCCTCCTTGTGGCCCTGTTCGGCTTGCTGGTCTACCTTGCTGGGGC 
CAAGTGTACCACCTGTGTGGAGGAGAAGGATTCCAAGGCCCGCCTGGTGCTCACCTCTGGGA 
TTGTCTTTGTCATCTCAGGGGTCCTGACGCTAATCCCCGTGTGCTGGACGGCGCATGCCATC 
ATCCGGGACTTCTATAACCCCCTGGTGGCTGAGGCCCAAAAGCGGGAGCTGGGGGCCTCCCT 
CTACTTGGGCTGGGCGGCCTCAGGCCTTTTGTTGCTGGGTGGGGGGTTGCTGTGCTGCACTT 
GCCCCTCGGGGGGGTCCCAGGGCGCCAGCCATTACATGGCCCGCTACTCAACATCTGCCCCT 
GC CAT CT CT C GGGGGC CCTCTGAG TAC C CTAC CAAGAATTACGTCTGACGTG GAGGGGAATG 
GOGGC T C CG CTGGC GCTAGAG C CATCCAGAAGTGGCAGTGC C CAACAG CTTTGGGATGGGTT 
CGTAC CT TTTGTTT CTGC CTC CTGCTATTTTT CTTTTGACTGAG GATATTTAAAATTC ATTT 
GAAAACT G AGC CAAGGTGTTGACTC AGACTCTCACT TAGGCTCT GC TGTTTCTCAC CCTT GG 
ATGATGGAG CCAAAGAGGGGATG CTTTGAGATTCTG GATCTTGACATG CC CATCTTAGAAGC 
CAGTCAAG CTATGG AACTAATGC GGAGG CTGCTTG CTG TGCTGG CT TTGCAACAAGACAGAC 
TGTCCCCAAGAGTTCCTGCTGCTGCTGGGGGCTGGGCTTCCCTAGATGTCACTGGACAGCTG 
CCCCCCATCCTACTCAGGTCTCTGGAGCTCCTCTCTTCACCCCTGGAAAAACAAATCATCTG 
TTAACAAAGGACTGCCCACCTC CGGAACTT CTGACCTCTGTTT CCTCCGTCCTGATAAGACG 
TCCACCCCCCAGGGCCAGGTCCCAGCTATGTAGACCCCCGCCCCCACCTCCAACACTGCACC 
CTTCrGCCCTGCCCCCCTCGTCTCACCCCCTTTACACTCACATTTTTATCAAATAAAGCATG 
TTTTGTTAGTGCA 



tfl/2.70 
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FIGURE 190 



></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73736 
><subunit 1 of 1, 220 aa, 1 stop 
><MW: 23292, pI: 8.43, NX(S/T): 0 

MAS AGMQ I LGWLTLLGWVNGL VS CALPMWKVTAFI GNS I WAQWWEGLWMS C WQSTGQM 
QCKVYDSLLALPQDLQAARALCVIALLVALFGLLVYIAGAKCTTCVEEKDSKARLVLTSGIV 
FVISGVLTLI PVCWTAHAI IRDFYNPLVAEAQKRELGASLYLGWAASGLLLLGGGLLCCTCP 
SGGSQGPSHYMARYSTSAPAISRGPSEYPTKNYV 



Transmembrane domains: 



amino acids 8-30 (type II), 82-102, 121-140, 166-186 
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FIGURE 191 

GCCAAGGAGAACATCATCAAAGACITCT 

AGCATCTTCTACCACTCCGAATTGAACCAGTCTTCAAAGTAAAGGCAATGGCATTTTATCCC 
TTGCAAATTGCTGGGCTGGTTCTTGGGTTCCTTGGCATGGTGGGGACTCTTGCCACAACCCT 
TCTGCCTCAGTGGTGGAGTATCAGCTTTTGTTGGCAGCAACATTATTGTCTTTGAGAGGCTC 
TGGGAAGGGCTCTGGATGAATTGCATCCGACAAGCCAGGGTCCGGTTGCAATGCAAGTTCTA 
TAGCTCCTTGTTGGCTCTCCCGCCTGCCCTGGAAACAGCCCGGGCCCTCATGTGTGTGGCTG 
TTG CT CTCT C CTTG ATCG CC CT GCTTATTGGCATCTGT GG CATGAA.GCAGGT C CAGTGCACA 
GG CT CTAACG AGAGGG C C AAAG CATAC CTT CT GGGAACTTCAGGAGTCCTCTTCATC CTGAC 
GGGTATCTTC GTTCTGATTCCGGTGAGCTGGACAGCCAATATAATCATCAGAGATTTC TACA 
ACCCAGCCAT CCAC ATAGGT CAGAAACGAGAGCTGGGAGCAGCACTTTTCCTTGGCTGGGCA 
AG CG CTG CTG TC CT CTT C ATTGGAGGGGGT CTGCTTTGTGGATTTTG CTG CTG CAACAGAAA 
GAAG CAAGGG TACAGATATCCAGT GCCTGGCTACCGTGTGC C ACACACAGAT AAGCGAAGAA 
ATACGACAATGCTTAGTAAGACCTCCACCAGTTATGT CTAATG CCTC CTTTTGG CTC CAAGT 
ATGG ACTATG GT CAATGTTTTTTATAAAGT CCTGCTAGAAAC TGTAAGTATGTG AGG CAGGA 
GAACTTGCTTTATGT CT AGATTTACATTG ATACGAAAG TTTCAATTTGTT ACTG GTGGTAGG 
AATGAAAATGACTTACTTGGACATTCTGACTTCAGGTGTATTAAATGCATTGACTATTGTTG 
GACCCAATCGCTGCTCCAATTTTCATATTCTAAATTCAAGTATACCC^TAATCATTAGCAAG 
TGTACAATGATGGACT ACTT ATTACTTT TTGACC AT CATGTATT AT CTGATAAGAAT CTAAA 
GTTGAAATTGATATT CTATAACAATAAAACATATACCT ATTCTA 
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FIGURE 192 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73737 
><subunit 1 of 1, 173 aa, 1 stop 
><MW: 18938, pI: 9.99, NX(S/T): 1 
MNCIRQARVRLQCKFYSSLLA^ 

AKAYLLGT S GVL F I LTG I FVL I P VS WTANI 1 1 RD F YNP A I H I GQKRE LGAAL FLGWAS AAVL 
FIGGGLLCGFCCCNRKKQGYRYPVPGYRVPHTDKRRNTTMLSKTSTSYV 

Important features of the protein: 
Transmembrane domains: 

amino acids 31-51, 71-90, 112-133 

N-glycosylation site. 

amino acids 161-164 



f9S/27Z> 
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FIGURE 193 

AGTGACAAT CTCAGAGCAGCTT CT ACAC CACAGCCATT T C CAGC ATGAAGAT C ACTGGGGG T 
CTCCTT CTGCTCTGTACAGTGGT CTATTTCTGTAGC AG CTCAGAAG CT GC TAGT CTGTCTC C 
AAAAAAAGTGGACTGCAGCATTTACAAGAAGTATCCAGTGGTGGCCATCCCCTGCCCCATCA 
CATACCTACCAGTTTGTGGTTCTGACTACATCACCTATGGGAATGAATGTCACTTGTGTACC 
GAGAGCTTGAAAAGTAATGGAAGAGTTCAGTTTCTTCACGATGGAAGTTGCTAAATTCTCCA 
TGGACATAGAGAG AAAGGAATGATATTCTCAT C ATCAT CTTCAT CAT C CC AGGCTCTG ACTG 
AGTTTCTTTCAGTTTTACTGATGTTCTGGGTGGGGGACAGAGCCAGATTCAGAGTAATCTTG 
ACTGAATGGAGAAAGT TTCTGTG CTAC CCCT ACAAACCCATG C CT CACTGACAGACCAGCAT 
TTTTTTTTTAACACGTCAATAAAAAAATAATCTCCCAGA 



WO 00/12708 
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FIGURE 194 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73739 
><subunit 1 of 1, 85 aa, 1 stop 
><MW: 9232, pI: 7.94, NX(S/T): 0 
MKITGGLLLLCTVVYFCSSSEAASLSPKKVDCSIYK^ 
ECHLCTESLKSNGRVQFLHDGSC 

Signal peptide: 

amino acids 1-19 



WO 00/12708 
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FIGURE 195 

CCCGCGCCCGGTTCTCCCTCGCAGCACCTCGAAGTGCGCCCCTCGCCCTCCTGCTCGCGCCC 
CGCCGCCATGGCTGCCTCCCCCGCGCGGCCTGCTGTCCTGGCCCTGACCGGGCTGGCGCTGC 
TCCTGCTCCTGTGCTGGGGCCCAGGTGGCATAAGTGGAAATAAACTCAAGCTGATGCTTCAA 
AAACGAGAAGCAC CTGTT CCAACT AAGACT AAAG TGGC CGTT GATGAGAATAAAG C CAAAGA 
ATTCCTTGGCAGCCTGAAGCGCCAGAAGCGGCAGCTGTGGGACCGGACTCGGCCCGAGGTGC 
AGCAGTGGTAC CAGCAGTTT CT CT AC ATGGGC TTTGATG AAG CG AAATTTGAAGATGACATC 
ACCT ATTG GCTTAACAGAG ATCGAAATGGACATGAATACTATGGCG ATTACTAC CAACG TCA 
CTATGATG AAGACT CTGCAATTGG T C CC CGGAGC C C CTACGGCTTTAGGC ATGGAGCCAG CG 
TCAACTACGATGACTACTAACCATGACTTGCCACACGCTGTACAAGAAGCAAATAGCGATTC 
T C TTCATG TATC TC CTAATGC CTT AC ACTACTTGGTTTCTGATTTG CTCTATTT CAG CAGAT 
CTTTTCTACCTACTTTGTGTGATCAAAAAAGAAGAGTTAAAACAACACATGTAAATGCCT 
TGATATTTCATGGGAATGCCrcrCATTTAAAAATAGAAATAAAGC^TTTTGTTAAAAAGA 



/9Z/Z7D 



WO 00/12708 



PCT/US99/20111 



FIGURE 196 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73742 
><subunit 1 of 1, 148 aa, 1 stop 
><MW: 17183, pI: 8.77, NX(S/T): 0 

MAAS PARPAVLALTGLALLLLLCWGPGG I SGNKLKLMLQKRE AP VPTKTKVAVDENKAKEFL 
GSLKRQKRQLWDRTRPEVQQV^QQFLYMGFDEAKFEDDITYWLNRDRNGHEYYGDYYQRHYD 
EDS AI GPRS P YG FRHGAS VNYDD Y 

Signal peptide: 

amino acids 1-30 
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FIGURE 197 

CGGCTCGAGCCCGCCCGGAAGTGCCCGAGGGGCCGCGATGGAGCTGGGGGAGCCGGGCGCTC 
GGTAGCGCGGCGGGCAAGGCAGGCGCCaSGACCCTGATTGAAGGGGTGGGTGATGAGGTGAC 
CGTC CTTTTCT CGGTG CTTGCCTG C CTT CTGGTG CT GG C C CTTG CC TGGGTCTCAACG CACA 
CCGCTGAGGGCGGGGACCCACTGCCCCAGCCGTCAGGGACCCCAACGCCATCCCAGCCCAGC 
GCAGCCATGGCAGCTACCGACAGCATGAGAGGGGAGGCCCCAGGGGCAGAGACCCCCAGCCT 
GAGACACAGAGGT CAAG CTG CACAGCCAGAGC CCAGCACGGGGTTCACAGCAACACCGCCAG 
CCCCGGACTCCCCGCAGGAGCCCCTCGTGCTACGGCTGAAATTCCTCAATGATTCAGAGCAG 
GTGGCCAGGGCCTGGCCCCACGACACCATTGGCTCCTTGAAAAGGACCCAGTTTCCCGGCCG 
GGAACAGCAGGTGCGACTCATCTACCAAGGGCAGCTGCTAGGCGACGACACCCAGACCCTGG 
GCAGCCTTCACCTCCCTCCCAACTGCGTTCTCCACTGCCACGTGTCCACGAGAGTCGGTCCC 
CCAAATCCCCCCTGCCCGCCGGGGTCCGAGCCCGGCCCCTCCGGGCTGGAAATCGGCAGCCT 
GCTGCTGCCCCTGCTGCTCCTGCTGTTGCTGCTGCTCTGGTACTGCCAGATCCAGTACCGGC 
CCTTCTTTCCCCTGACCGCCACTCTGGGCCTGGCCGGCTTCACCCTGCTCCTCAGTCTCCTG 
G CCTTTGCCATGTACCG CC CGTAGTG CCT CCGCGGG CGCT TGG CAG CGTC GC CGGCCCCTC C 
GGACCTTGCTCCCCGCGCCGCGGCGGGAGCTGCTGCCTGCCCAGGCCCGCCTCTCCGGCCTG 
CCTCTTCCCGCTGCCCTGGAGCCCAGCCCTGCGCCGCAGAGGACTCCCGGGACTGGCGGAGG 
CCCCGCCCTGCGACCGCCGGGGCTCGGGGCCACCTCCCGGGGCTGCTGAACCTCAGCCCGCA 
CTGGGAGTGGGCTCCTCGGGGTCGGGCATCTGCTGTCGCTGCCTCGGCCCCGGGCAGAGCCG 
GGCCGCCCCGGGGGCCCGTCTTAGTGTTCTGCCGGAGGACCCAGCCGCCTCCAATCCCTGAC 
AGCTCCTTGGGCTGAGTTGGGGACGCCAGGTCGGTGGGAGGCTGGTGAAGGGGAGCGGGGAG 
GGGC AG AGGAGTT C C C CGGAAC CCGTGC AGAT T AAAGTAACTGTGAAGTTTTAAAAAAAAAA 
AAAAAAAA 
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FIGURE 198 

MTLIEGVGDEVTVLFSVLACIJjVLALAWSTHTO 

RGEAPGAETPSLRHRGQAAQPEPSTGFTATPPAPDSPQEPLVLRLKFLNDSEQVARAWPHDT 
IGSLKRTQFPGREQQVRLIYQGQLLGDDTQTLGSLHLPPNCVLHCHVSTRVGPPNPPCPPGS 
EPGPSGLEIGS L LL PLLLLLLLLLWYCQ I Q YRP F FP LT ATLGLAGF TLLLS LLAF AMYR P 

Signal peptide: 

amino acids 1-31 

Transmembrane domain: 

amino acids 195-217 



2.0//27O 



WO 00/12708 
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FIGURE 199 

GAGATTGGAAACAGCCAGGTTGGAGCAGTGAGTGAGTAAGGAAACCTGGCTGCCCTCTCCAG 
ATT C CCCAGGCTCT CAGAGAAG AT CAG CAGAAAGT CTG CAAG AC CCTAAGAAC CAT CAGC CC 
TCAGCTGCACCTCCTCCCCTCCAAGGATGACAAAGGCGCTACTCATCTATTTGGTCAGCAGC 
TTTCTTGCCCTAAATCAGGCCAGCCTCATCAGTCGCTGTGACTTGGCCCAGGTGCTGCAGCT 
GGAGGACTTGGATGGGTTTGAGGGTTACTCCCTGAGTGACTGGCTGTGCCTGGCTTTTGTGG 
AAAGCAAGTTCAACATATCAAAGATAAATGAAAATGCGGATGGAAGCTTTGACTATGGCCTC 
TTCC AGAT CAACAGCCAC TACTGGTG CAACGATTATAAGAGTTACTCGGAAAAC CTTTGCCA 
CGTAGACTGTCAAGATCTGCTGAATCCCAACCTTCTTGCAGGCATCCACTGCGCAAAAAGGA 
TTGT GT C CGGAG CACGGGGGATGAACAACT GG GTAGAATGGAGGTTG CACTGTTCAGG C C GG 
CCACTCTCCTACTGGCTGACAGGATGCCGCCTGAGAJGAAACAGGGTGCGGGTGCACCGTGG 
AGTCATTCCAAGACTCCTGTCCTCACTCAGGGATTCTTCATTTCTTCTTCCTACTGCCTCCA 
CTTCATGTTATTTTCTT C CCT T CC CATTTACAACTAAAACTGAC C AGAGC C CCAGGAAT AAA 
TGGTTTTCTTGGCTTCCTCCTTACTCCCATCTGGACCCAGTCCCCTGGTTCCTGTCTGTTAT 
TTGTAAACTGAGGACCACAATAAAGAAATCTTTATATTTATCG 



WO 00/12708 
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FIGURE 200

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73746
xsubunit 1 of 1, 148 aa, 1 stop 
><MW: 16896, pi: 6.05, NX(S/T): 1 

MTKALLIYLVSSFIJUiNQASLISRCDLAQVLQLEDLDGFEGYSLSDWLCLAFVESKFNISKI 
NENADGSFDYGLFQINSHYWCNDYKSYSENLCHVDCQDLLNPl^LAGIHCAKRIVSGARGl^ 
NWVEWRLHCSGRPLSYWLTGCRIjR 

Signal peptide: 

amino acids 1-18 
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FIGURE 201 

TCTGACCTGACTGGAAGCGTCCAAAGAGGGACGGCTGTCAGCCCTGCTTGACTGAGAACCCA 
CCAGCTCATCCCAGACACCTCATAGCAACCTATTTATACAAAGGGGGAAAGAAACACCTGAG 
CAGAATGGAATCATTATTTTTTTCCCAAGGAGAAAACCGGGGTAAAGGGAGGGAAGCAATTC 
AATTTGAAGTCCCTGTGAATGGGCTTTCAGAAGGCAATTAAAGAAATCCACTCAGAGAGGAC 
TTGGGGTGAAACTTGGGTCCTGTGGTTTTCTGATTGTAAGTGGAAGCAGGTCTTGCACACGC 
TGTTGGCAAATGTCAGGACCAGGTTAAGTGACTGGCAGAAAAACTTCCAGGTGGAACAAGCA 
ACCCATGTTCTGCTGCAAGCTTGAAGGAGCCTGGAGCGGGAGAAAGCTAACTTGAACATGAC 
CTGTTGCATTTGGCAAGTTCTAGCAACATGCTCCTAAGGAAGCGATACAGGCACAGACCATG 
CAGACT CCAGTT CCTCCTGCTGCT CCTGATGCTGGGATGCGTCCTGATGATGGTGGCGATGT 
TGCACCCTCCCCACCACACCCTGCACCAGACTGTCACAGCCCAAGCCAGCAAGCACAGCCCT 
GAAGCCAGGTACCGCCTGGACTTTGGGGAATCCCAGGATTGGGTACTGGAAGCTGAGGATGA 
GGGTGAAGAGTACAGCCCTCTGGAGGGCCTGCCACCCTTTATCTCACTGCGGGAGGATCAGC 
TG CTGGTGGCCGTGGC CT TACC CC AGGC CAGAAGGAAC CAG AGCCAGGGCAGGAG AGGTGGG 
AG CT AC CG CCTC AT CAAG CAG C CAAGGAGGCAGGAT AAGGAAGCCC CAAAG AGGGACTGGGG 
GGCTGATGAGGACGGGGAGGTGTCTGAAGAAGAGGAGTTGACCCCGTTCAGCCTGGACCCAC 
GTGGCCTCCAGGAGGCACTCAGTGCCCGCATCCCCCTCCAGAGGGCTCTGCCCGAGGTGCGG 
CACCCACTGTGTCTGCAGCAGCACCCTCAGGACAGCCTGCCCACAGCCAGCGTCATCCTCTG 
TTTCCATGATGAGGCCTGGTCCACTCTCCTGCGGACTGTACACAGCATCCTCGACACAGTGC 
CC AGGGCCTTC CTGAAGGAGATCATC CT CGTGGACGACCT CAG C CAGC AAGG ACAACTCAAG 
T CTGCTC TCAGCGAATATGT GGC CAGGC TGGAGGGGGTGAAG TT AC T CAGGAGCAACAAGAG 
GCTGGGTGCCATCAGGGCCCGGATGCTGGGGGCCACCAGAGCCACCGGGGATGTGCTCGTCT 
TCATGGATGCCCACTGCGAGTGCCACCCAGGCTGGCTGGAGCCCCTCCTCAGCAGAATAGCT 
GGTGACAGGAGCCGAGTGGTATCTCCGGTGATAGATGTGATTGACTGGAAGACTTTCCAGTA 
TTAC CC CT CAAAGG AC CTGCAGCG TGGGGTGTTGGACTGGAAGCTGGATTTCCACTGGGAAC 
CTTTGCCAGAGCATGTGAGGAAGGCCCTCCAGTCCCCCATAAGCCCCATCAGGAGCCCTGTG 
GTGC C C GGAG AGGTGGTGGC CATGGACAGACATTACTTCCAAAACACTGGAGCGT ATGACTC 
TCTTATGTCGCTGCGAGGTGGTGAAAACCTCGAACTGTCTTTCAAGGCCTGGCTCTGTGGTG 
GCTCTGTTGAAATCCTTCCCTGCTCTCGGGTAGGACACATCTACCAAAATCAGGATTCCCAT 
TCCCCCCTCGACCAGGAGGCCACCCTGAGGAACAGGGTTCGCATTGCTGAGACCTGGCTGGG 
GT CATT CAAAGAAACCTT CTACAAGCATAG CCCAGAGGCCTTCT CCTT GAGCAAGG CTGAGA 
AG CC AGACTGCATGGAACGCTTGCAGCTGCAAAGGAGACTGGGTTGT C GGACATTC CACTGG 
TTTCTGGCTAATGTCTACCCTGAGCTGTACCCATCTGAACCCAGGCCCAGTTTCTCTGGAAA 
GCTC CA CAACACTGGACTTGGGCTCTGTGCAGACTGC C AGGCAGAAGG GGACAT C CTGGG CT 
GT CC CATGGTGTTGG CTCCTTGCAGTGACAGC CGG CAGCAACAGTACCTGCAG C ACAC CAG C 
AGGAAGGAGATTCACTTTGGCAGCCCACAGCACCTGTGCTTTGCTGTCAGGCAGGAGCAGGT 
GATTCTTCAGAACTGCACGGAGGAAGGC CTGG CCAT CCAC CAGCAG CACTGGGACTTCCAGG 
AGAATGGGATGATTGTCCACATTCTTTCTGGGAAATGCATGGAAGCTGTGGTGCAAGAAAAC 
AATAAAGATTTGTACCTGCGTCCGTGTGATGGAAAAGCCCGCCAGCAGTGGCGATTTGACCA 
GATAAATG CTGTGGATGAAC G ATGAAT GT CAATGT CAGAAGGAAAAGAGAATTTTGGCCATC 
AAAATCCAGCTCCAAG TGAACGTAAAGAGCTTAT ATATTT CATGAAGCTGATC CTTTTGTGT 
GTGTGCTCCTTGTGTTAGGAGAGAAAAAAGCTCTATGAAAGAATATAGGAAGTTTCTCCTTT 
T CACAC CTT ATTT CATTGACTGCTGGCTGCTTA 
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FIGURE 202 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA73760 
xsubunit 1 of 1, 639 aa, 1 stop
><MW: 73063, pi: 6.84, NX(S/T): 2

MLLRKRYRHRPCRLQFLLLLLMLGCVIilviMVAMIiHPPHHTLHQTVTAQA 
ESQDWVLEAEDEGEEYSPLEGLPPFISLREDQLLVAVALPQARRNQSQGRRGGSYRLIKQPR 
RQDKEAPKRDWGADEDGEVSEEEELTPFSLDPRGLQEALSARIPLQRALPEVRHPLCLQQHP 
QDSLPTASVILCFHDEAWSTLLRTVHS I LDTVPRAFLKEI ILVDDLSQQGQLKSALSEYVAR 
LEG^KLLRSNKRIiGAIRARMLGATRATGDVLVFMDAHCECHPGWLEPLLSRIAGDRSRVVSP 
VIDVID WKTFQYYPS KDLQRGVLDWKLDFHWE PLPEHVRKALQS PISPIRS PWPGEWAMD 
RHYFQNTGAYDSLMSLRGGENLELSFKAWLCGGSVEILPCSRVGHIYQNQDSHSPLDQEATL 
RNRVRIAETWLGSFKETFYKHSPEAFSLSKAEKPDCMERLQL^ 

YPSEPRPSFSGKLHNTGLGLCADCQAEGDILGCPMVLAPCSDSRQQQYLQHTSRKEIHFGSP 
QHLCFAVRQEQVI LQNCTEEGLAI HQQHWDFQENGM I VHI LSGKCMEAWQENNKDLYLRPC 
DGKARQQWRFDQ INAVDER 

Signal peptide: 

amino acids 1-28 
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FIGURE 203

CGCCAAGCATGCAGTAAAGGCTGAAAATCTGGGTCACAGCTGAGGAAGACCTCAGACATGGA 
GTCCAGGATGTGGCCTGCGCTGCTGCTGTCCCACCTCCTCCCTCTCTGGCCACTGCTGTTGC 
TGCCCCTCCCACCGCCTGCTCAGGGCTCTTCATCCTCCCCTCGAACCCCACCAGCCCCAGCC 
CGCCCCCCGTGTGCCAGGGGAGGCCCCTCGGCCCCACGTCATGTGTGCGTGTGGGAGCGAGC 
ACCTCCACCAAGCCGATCTCCTCGGGTCCCAAGATCACGTCGGCAAGTCCTGCCTGGCACTG 
CACCCCCAGCCACCCCATCAGGCTTTGAGGAGGGGCCGCCCTCATCCCAATACCCCTGGGCT 
ATCGTGTGGGGTCCCACCGTGTCTCGAGAGGATGGAGGGGACCCCAACTCTGCCAATCCCGG 
ATTTCTGGACTATGGTTTTGCAGCCCCTCATGGGCTCGCAACCCCACACCCCAACTCAGACT 
CCATGCGAGGTGATGGAGATGGGCTTATCCTTGGAGAGGCACCTGCCACCCTGCGGCCATTC 
CTGTTCGGGGGCCGTGGGGAAGGTGTGGACCCCCAGCTCTATGTCACAATTACCATCTCCAT 
CATCATTGTTCTCGTGGCCACTGGCATCATCTTCAAGTTCTGCTGGGACCGCAGCCAGAAGC 
GACG CAGACC CT CAGG GCAG CAAGGTGC CCTG AGGCAGGAGGAGAGCCAG C AGC CACTGACA 
GACCTGTCCCCGGCTGGAGTCACTGTGCTGGGGGCCTTCGGGGACTCACCTACCCCCACCCC 
TGACCATGAGGAGCCCCGAGGGGGACCCCGGCCTGGGATGCCCCACCCCAAGGGGGCTCCAG 
C CTT C CAGTTGAACCG GTGAGGGC AG GGGCAATGGGATGGGAGGGCAAAGAGGGAAGG CAAC 
TTAGGTCTTCAGAGCTGGGGTGGGGGTGCCCTCTGGATGGGTAGTGAGGAGGCAGGCGTGGC 
CTCCCACAGCCCCTGGCCCTCCCAAGGGGGCTGGACCAGCTCCTCTCTGGGAGGCACCCTTC 
CTTCTCCCAGTCTCTCAGGATCTGTGTCCTATTCTCTGCTGCCCATAACTCCAACTCTGCCC 
TCTTTGGTTTTTTCTCATGCCACCTTGTCTAAGACAACTCTGCCCTCTTAACCTTGATTCCC 
CCTCTTTGTCTTGAACTTCCCCTTCTATTCTGGCCTACCCCTTGGTTCCTGACTGTGCCCTT 
TCCCTCTTCCTCTCAGGATTCCCCTGGTGAATCTGTGATGCCCCCAATGTTGGGGTGCAGCC 
AAGCAGGAGGCCAAGGGGCCGGCACAGC CC C CATCC CZACTGAGGGTGGGG CAG CTGTGGGGA 
GCTGGGGCCACAGGGGCTCCTGGCTCCTGCCCCTTGCACACCACCCGGAACACTCCCCAGCC 
CCACGGGCAATCCTATCTGCTCGCCCTCCTGCAGGTGGGGGCCTCACATATCTGTGACTTCG 
GGTCCCTGTCCCCACCCTTGTGCACTCACATGAAAGCCTTGCACACTCACCTCCACCTTCAC 
AGGCCATTTGC^C^CGCTCCTGCACCCTCTCCCCGTCCATACCGCTCCGCTCAGCTGACTCT 
CATGTTCTCTCGTCTCACATTTGCACTCTCTCCTTCCGACATTCTGTGCTCAGCTCACTCAG 
TGGTCAGCGTTTCCTGCACACTTTACCTCTCATGTGCGTTTCCCGGCCTGATGTTGTGGTGG 
TGTGCGGCGTGCTCACTCTCTCCCTCATGAACACCCACCCACCTCGTTTCCGCAGCCCCTGC 
GTGCTGCTCCAGAGGTGGGTGGGAGGTGAGCTGGGGGCTCCTTGGGCCCTCATCGGTCATGG 
TCTCGTCCCATTCCACACCATTTGTTTCTCTGTCTCCCCATCCTACTCCAAGGATGCCGGCA 
TCACCCTGAGGGCTCCCCCTTGGGAATGGGGTAGTGAGGCCCCAGACTTCACCCCCAGCCCA 
CTGCT AAAATCT GTTTTCTGACAGATGGGT TTTGGGGAGT CG CCT G CTGCACTACATGAGAA 
AGGGACTCCCATTTGCCCTTCCCTTTCTCCTACAGTCCCTTTTGTCTTGTCTGTCCTGGCTG 
TCTGTGTGTGTGCCATTCTCTGGACTTCAGAGCCCCCTGAGCCAGTCCTCCCTTCCGAGCCT 
CCCTTTGGGCCTCCCTAACTCCACCTAGGCTGCCAGGGACCGGAGTCAGCTGGTTCAAGGCC 
ATCGGGAGCTCTGCCTCCAAGTCTACCCTTCCCTTCCCGGACTCCCTCCTGTCCCCTCCTTT 
CCTCCCTCCTTCCTTCCACTCTCCTTCCTTTTGCTTCCCTGCCCTTTCCCCCTCCTCAGGTT 
CTTCCCTCCTTCTCACTGGTTTTTCCACCTTCCTCCTTCCCTTCTTCCCTGGCTCCTAGGCT 
GTGATATATATTTTTGT AT TAT CTCT TT CTTCTT CTTGTGGTGATCAT CTTGAATTACTGTG 
GGATGTAAGTTTCAAAATTTTC AAATAAAG CCTTTG CAAGATAA 
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FIGURE 204 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76393
xsubunit 1 of 1, 243 aa, 1 stop
><MW: 26266, pi: 8.43, NX(S/T): 1

MRPQGPAASPQRLRGLLLLLLLQLPAPS SASE I PKGKQKAQLRQREVVDLYNGMCLQGPAGV 
PGRDGSPGANVIPGTPGIPGRDGFKGEKGECLRESFEESWTPNYKQCSWSSLNYGIDLGKIA 
ECTFTKMRSNSALRVLFSGSLRLKCRNACCQRWYFTFNGAECSGPLPIEAIIYLDQGSPEMN 
STINIHRTSSVEGLCEGIGAGLVDVAIWVGTCSDYPKGDASTGWNSVSRIIIEELPK 

Signal peptide: 

amino acids 1-30 

Transmembrane domain: 

amino acids 195-217 
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FIGURE 205 

GTTAACCAGCGCAGTCCTCCGTGCGTCCCGCCCGCCGCTGCCCTCACTCCCGGCCAGG&SSG 
CATCCTGTCTGGCCCTGCGCATGGCGCTGCTGCTGGTCTCCGGGGTTCTGGCCCCTGCGGTG 
CTCACAGACGATGTTCCACAGGAGCCCGTGCCCACGCTGTGGAACGAGCCGGCCGAGCTGCC 
GT CGGGAGAAGG C C C CGTGGAGAG CACC AG C C CC GG CCGGGAGC CCGTGGACAC CGGT CC CC 
CAGCCCCCACCGTCGCGCCAGGACCCGAGGACAGCACCGCGCAGGAGCGGCTGGACCAGGGC 
GGCGGGTCGCTGGGGCCCGGCGCTATCGCGGCCATCGTGATCGCCGCCCTGCTGGCCACCTG 
CGTGGTGCTGGCGCTCGTGGTCGTCGCGCTGAGAAAGTTTTCTGCCTCC TGAA GCGAATAAA 
GGGGCCGCGCCCGGCCGCGGCGCGACTCGGCAAAAAAAAAAAAAAA 



WO 00/12708 
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FIGURE 206 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76398
xsubunit 1 of 1, 121 aa, 1 stop
><MW: 12073, pi: 4.11, NX(S/T): 0

MASCLALRMALLLVSGVLAPAVLTDDVPQEPVPTLWNEPAELPSGEGPVESTSPGREPVDTG 
PPAPTOAPGPEDSTAQERLDQGGGSLGPGAIAAIVIAALLATOTVI^ 

Important features of the protein: 
Signal peptide: 

amino acids 1-19 

Transmembrane domain: 

amino acids 91-110 

Glycosaminoglycan attachment site. 

amino acids 44-47 

cAMP- and cGMP-dependent protein kinase phosphorylation site.

amino acids 116-119 

N-myristoylation site. 

amino acids 91-96 



209/270
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FIGURE 207 

GGCCGTTGGTTGGTGCGCGGCTGAAGGGTGTGGCGCGAGCAGCGTCGTTGGTTGGCCGGCGG 
CGGGCCGGGACGGGCATGGCCCTGCTGCTGTGCCTGGTGTGCCTGACGGCGGCGCTGGCCCA 
CGGCTGTCTGCACTGCCACAGCAACTTCTCCAAGAAGTTCTCCTTCTACCGCCACCATGTGA 
ACTTCAAGTCCTGGTGGGTGGGCGACATCC CC GTGT CAGGGGCG CTGCTCACCGACTGGAGC 
GACGACACGATGAAGGAGCTGCACCTGGCCATCCCCGCCAAGATCACCCGGGAGAAGCTGGA 
CCAAGTGGCGACAGCAGTGTACCAGATGATGGATCAGCTGTACCAGGGGAAGATGTACTTCC 
CCGGGTATTTCCCCAACGAGCTGCGAAACATCTTCCGGGAGCAGGTGCACCTCATCCAGAAC 
GCCATCAT CGAAAGGCAC CTGGCACCAGGCAGCTGGGGAGGAGGGCAGCTCTCCAGGGAGGG 
ACCCAGCCTAGCACCTGAAGGATCAATGCCATCACCCCGCGGGGACCTCCCCTAAGTAGCCC 
CCAGAGGCGCTGGGAGTGTTGCCACCGCCCTCCCCTGAAGTTTGCTCCATCTCACGCTGGGG 
GTCAACCTGGGGAC CC CT T CCCT C CGGG CCATGGACACACAT ACATGAAAACCAGGCCG CAT 
CGACTGTCAGCACCGCTGTGGCATCTTCCAGTACGAGACCATCTCCTGCAACAACTGCACAG 
ACTCGCACGTCGCCTGCTTTGGCTATAACTGCGAGTAGGGCTCAGGCATCACACCCACCCGT 
GCCAGGGCCCTACTGTCCCTGGGGTCCCAGGCTCTCCTTGGAGGGGGCTCCCCGCCTTCCAC 
CTGGCTGTCATCGGGTAGGGCGGGGCCGTGGGTTCAGGGGCGCACCACTTCCAAGCCTGTGT 
CCCACAGGTCCTCGGCGCAGTGGAAGTCAGCTGTCCAGGGCCTCCTGAACTACATAAATAAC 
TGGCACAAGTAAGTCCCCTCCTCAAACCAACACAGGCAGTGTGTGTATGTGAGCACCTCGTG 
GGTGAGTATGTGTGGGGCACAGGCTGGCTCCCTCAGCTCCCACGTCCTAGAGGGGCTCCCGA 
GGAGGTGGAACCTCAACCCAGCTCTGCGCAGGAGGCGG CTGCAGTC CTTTTCTC CCTCAAAG 
GTCTCCGACCCTCAGCTGGAGGCGGGCAT CTTTCCTAAAGGGTC CC CATAGGGT CTGGTTCC 
ACCCCATCCCAGGTCTGTGGTCAGAGCCTGGGAGGGTTCCCTACGATGGTTAGGGGTGCCCC 
ATGGAGGGGCTGACTGCCC CAC ATTGCCTTT C AGACAGGACACG AG CATGAGGTAAGG CCGC 
CCTGACCTGGACTTCAGGGGGAGGGGGTAAAGGGAGAGAGGAGGGGGGCTAGGGGGTCCTCT 
AGATCAGTGGGGGCACTGCAGGTGGGGCTCTCCCTATACCTGGGACACCTGCTGGATGTCAC 
CTCTGCAACCA(IACCCATGTGGTGGTTTCATGAACAGACCACGCTCCTCTGCCTTCTCCTGG 
C CTGGGACACACAGAG CC AC CCCGGCCT TGTGAGTGAC C CAGAGAAGGGAGGC CT CGGGAGA 
AGGGGTGCTCGTAAGCCAACACCAGCGTGCCGCGGCCTGCACACCCTTCGGACATCCCAGGC 
ACGAGGGTGT CGTGGATGTGGCCACACATAGGAC CACACGT CCCAGCTGGGAGGAGAGGC CT 
GGGGC CCC CAGGGAGGGAGG CAGGGGGTGGGGGACATGGAGAGCTGAGGCAG CCTCGTCTC C 
CCGCAGCCTGGTATCGCCAGCCTTAAGGTGTCTGGAGCCCCCACACTTGGCCAACCTGACCT 
TGGAAGATGCTG CTGAGTGT CT CAAGCAGCACTGACAGCAGCTGGGCCTGC C CC AGGGCAAC 
GTGGGGGCGGAGACTCAGCTGGACAGCCCCTGCCTGTCACTCTGGAGCTGGGCTGCTGCTGC 
CT CAGGAC CC CC TCTC CGACC CCGGACAGAGCTGAGCTGG C CAG GGCCAGGAGGG CGGGAGG 
GAGGGAATGGGGGTGGGCTGTGCGCAGCATCAGCGCCTGGGCAGGTCCGCAGAGCTGCGGGA 
TGTGATTAAAGTCCCTGATGTTTCTC 
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FIGURE 208 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76399
xsubunit 1 of 1, 157 aa, 1 stop 
><MW: 17681, pi: 7.65, NX(S/T): 1 

MALLLCLVCLTAALAHGCLHCH SNF S KKF S FYRHHVNF KS WWVGD I P VSGALLTDWSDDTMK 
ELHLAI PAKiTREKLDQVATAVYQMMDQLYQGKMYFPGYFPNELRNIFREQVHLIQNAIIER 
HLAPGS WGGGQLSREGPSLAPEGSMPS PRGDLP 

Signal peptide: 

amino acids 1-15 
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FIGURE 209 

AGCAGGAGCAGGAGAGGGACAATGGAAGCTQCCCCGTCCAGGTT CATGTT CCTCTTATTTCT 
C CTCACGTGTGAG CTGGCTGCAGAAGTTGCTGCAGAAGT TGAGAAATC CT CAGATGGT CCTG 
GTGCTGCCCAGGAACCCACGTGGCTCACAGATGTCCCAGCTGCCATGGAATTCATTGCTGCC 
ACTGAGGTGG CTGTCAT AGGCTT C TT CCAGGATTTAGAAATACCAG CAGTG C CC ATACT CCA 
TAG CATGGTG CAAAAATTC C CAGG CGTGTCATTT GGGATCAG CACTGATTCTGAGGT TCTGA 
CACACTACAACATCACTGGGAACACC AT CTGC CT CTTTCGCCTGGTAGACAATGAACAACTG 
AATTTAGAGGACGAAGACATTGAAAGCATTGATGCCACCAAATTGAGCCGTTTCATTGAGAT 
CAACAGC C TC CAGATGGT GACAGAGT ACAAC C CTGTGACTGTGATTGGGTTATTCAACAG CG 
TAAT TCAG ATT CATC TCCTC CTGATAATGAACAAGGCCT CC C CAGAGT ATG AAGAGAACATG 
CACAGATACCAGAAGGCAGCCAAGCTCTTCCAGGGGAAGATTCTCTTTATTCTGGTGGACAG 
TGGTATG AAAGAAAATGGGAAGGTGATATCAT TTTTCAAACTAAAGGAGT CT C AACTG C CAG 
CTTTGGCAATTTACCAGACTCTAGATGACGAGTGGGATACACTGCCCACAGCAGAAGTTTCC 
GT AGAGCATGTG CAAAACTTTT GTGATGGATT C CTAAGTGGAAAATTGTTGAAAGAAAAT CG 
TG AAT CAGAAGGAAAGACT C CAAAGGTGGAACT CTg&CTT C TC CTTGGAACTACATATGGC C 
AAGTATCTACTTTATGCAAAGTAAAAAGGCACAACTCAAATCTCAGAGACACTAAACAACAG 
GATCACTAGGCCTGCC^CCACACACACACGCACGTGCACACACGCACGCACGCGTGCACAC 
ACACACGCGCACACACAC AC ACACACAGAGCTTCATTTCCTGT CTTAAAAT CTCGTTTT CTC 
TTCTTCCTTCTTTTAAATTTCATATCCTCACTCCCTATCCAATTTCCTTCTTATCGTGCATT 
(^TACTCTGTAAGCCCATCTGTAACACACCTAGATCAAGGCTTTAAGAGACTCACTGTGATG 
CCTCTATG AAAGAGAGG CATT C CT AGAGAAAG ATTGTT C CAATTTGTCATTTAATAT CAAGT 
TTGTAT ACTG CACATGACTT AC AC ACAACATAGTT CCTGCT CTTTTAAGGT TACCT AAGGGT 
TGAAACTCTACCTTCTTTCATAAGCACATGTCCGTCTCTGACTCAGGATCAAAAACCAAAGG 
ATGGTTTTAAAC^CCTTTGTGAAATTGTCTTTTTGCCAGAAGTTAAAGGCTGTCTCCAAGTC 
CCTGAACTCAGCAGAAATAGACCATGTGAAAACTCCATGCTTGGTTAGCATCTCCAACTCCC 
TAT GTAAATCAACAAC CTG CATAATAAATAAAAGG CAAT CATGTTATA 
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FIGURE 210 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76401
xsubunit 1 of 1, 273 aa, 1 stop 
><MW: 30480, pi: 4.60, NX(S/T): 1 

MEAAPSRFMFLLFLLTCELAAEVAAEV2KSSDGPGAAQEPTWLTDVPAAMEFIAATEVAVIG 
FFQDLE I PAVP I LHSMVQKFPGVSFG IS TDSEVLTHYNI TGNT I CLFRLVDNEQLNLEDEDI 
ES IDATKLSRFI EINSLHMVTEYNPVTVIGLFNSVIQIHLLLIMNKASPEYEENMHRYQKAA 
KLFQGKILFILVDSGMKENGKVISFFKLKESQLPALAIYQTLDDETOTLPTAEVSVEHVQNF 
CDGFLSGKLLKENRESEGKTPKVEL 

Signal peptide: 

amino acids 1-20 

Transmembrane domain: 

amino acids 143-162 



213/270
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FIGURE 211 

GGAGAGCCGCGGCTGGGACCGGAGTGGGGAGCGCGGCGTGGAGGTGCCACCCGGCGCGGGTG 
GCGGAGAGATCAGAAGCCTCTTCCCCAAGC CG AG CCAACCT CAGCGGGGACC CGGGCTCAGG 
GACGCGGCGGCGGCGG03GCGACTGCAGTGGCTGGACGATGGCAGCGTCCGCCGGAGCCGGG 
GCGGTGATTGCAGCCCCAGACAGCCGGCGCTGGCTGTGGTCGGTGCTGGCGGCGGCGCTTGG 
G CT CTTGACAGCTGGAGTATCAG C CTTGGAAGTATATACG CC AAAAGAAATCTTCGTGG CAA 
ATGGTACACAAGGGAAGCT GAC CTGCAAGT TCAAGT CT AC TAGT ACGACTGG CGGGTTGACC 
TCAGTCTCCTGGAGCTTCCAGCCAGAGGGGGCCGACACTACTGTGTCGTTTTTCCACTACTC 
CCAAGGGCAAGTGTACCTTGGGAATTATCCACCATTTAAAGACAGAATCAGCTGGGCTGGAG 
AC CTTGAC AAGAAAGATG CATCAATCAACATAGAAAAT AT GC AGTTTATACACAATGG CACC 
TATATCTGTGATGTCAAAAACCCTCCTGACATCGTTGTCCAGCCTGGACACATTAGGCTCTA 
TGTC GTAG AAAAAGAGAATTTGCC TG TGTTTC CAGTTTGGGTAGTGGTGGGCATAGTTACTG 
C TGTGGTC CTAGGT CT CACT CTG CTC AT CAGCATGATTCTGGCTGTC CT CTATAGAAGGAAA 
AACTCTAAACGGGATTACACTGGCTGCAGTACATCAGAGAGTTTGTCACCAGTTAAGCAGGC 
TCCTCGGAAGTCCCCCTCCGACACTGAGGGTCTTGTAAAGAGTCTGCCTTCTGGATCTCACC 
AGGG CC CAGT CAT ATATGCACAGTTAGACCACTCCGG CGGAC AT CACAGTGACAAG ATTAAC 
AAGT C AGAGT CTGTGGT GTATGCG GATATCCGAAAGAATTAAGAGAAT AC CTAG AACATAT C 
CTCAGCAAGAAACAAAACCAAACTGGACTCTCGTGCAGAAAATGTAGCCCATTACCACATGT 
AGCCTTGGAGACCCAGGCAAGGACAAGTACACGTGTACTCACAGAGGGAGAGAAAGATGTGT 
ACAAAGGATATGTATAAATATTCT ATTTAGTCAT CC TG AT ATGAGGAG CC AGTGTTGCATGA 
TGAAAAGATGGTATGATTCTACATATGTACCCATTGTCTTGCTGTTTTTGTACTTTCTTTTC 
AGGTCATTT ACAATTGGGAGATTT C AGAAACATT CCTTT CAC CAT C ATTT AGAAATGGTTTG 
CCTTAATGGAGACAATAGCAGATCCTGTAGTATTTCCAGTAGACATGGCCTTTTAATCTAAG 
GGCTTAAGACTGATTAGTCTTAGCATTTACTGTAGTTGGAGGATGGAGATGCTATGATGGAA 
GCATACCCAGGGTGGC CTTTAGCACAGTAT CAGTACCATTTATT TGTCTGCCGCTTTTAAAA 
AATACCCATTGGCTATGCCACTTGAAAACAATTTGAGAAGTTTTTTTGAAGTTTTTCTCACT 
AAAATATGGGGCAATTGTTAGCCTTACATGTTGTGTAGACTTACTTTAAGTTTGCACCCTTG 
AAATGTGT CATAT C AATTT CTGGATT C ATAATAGCAAG ATTAGCAAAGGATAAATGC CGAAG 
GTCACTTCATTCTGGACACAGTTGGATCAATACTGATTAAGTAGAAAATCCAAGCTTTGCTT 
GAGAACTTTTGTAACGTGGAGAGTAAAAAGTATCGGTTTTA 
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FIGURE 212 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76510
xsubunit 1 of 1, 269 aa, 1 stop 
><MW: 29082, pi: 9.02, NX(S/T): 3 

MAASAGAGAVIAAPDSRRWLWSVLAAALGLLTAGVS ALEVYTPKE I FVANGTQGKLTCKFKS 
TSTTGGLTSVSWSFQPEGADTTVS FFHYSQGQVYLGNYPP FKDRI S WAGDLDKKDAS INIEN 
MQ F IHNGTYI CDVKNPPD I WQPGHIRLYWEKENLPVFPVWVWGIVTAWLGLTLL I SM I 
LAVLYRRKNSKRDYTGCSTSESLSPVKQAPRXSPSDTEGLVKSLPSGSHQGPVIYAQLDHSG 
GHHSDKINKSESWYADIRKN 

Signal peptide: 

amino acids 1-37

Transmembrane domain: 

amino acids 161-183 



215/270
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FIGURE 213

GCCGGCTGTGCAGAGACGCCATGTACCGGCTCCTGTCAGCAGTGACTGCCCGGGCTGCCGCC 
CCCGGGGGCTTGGCCTCAAGCTGCGGACGACGCGGGGTCCATCAGCGCGCCGGGCTGCCGCC 
TCTCGGCCACGGCTGGGTCGGGGGCCTCGGGCTGGGGCTGGGGCTGGCGCTCGGGGTGAAGC 
TGGCAGGTGGGCTGAGGGGCGCGGCCCCGGCGCAGTCCCCCGCGGCCCCCGACCCTGAGGCG 
TCGCCTCTGGCCGAGCCGCCACAGGAGCAGTCCCTCGCCCCGTGGTCTCCGCAGACCCCGGC 
GCCGCCCTGCTCCAGGTGCTTCGCCAGAGCCATCGAGAGCAGCCGCGACCTGCTGCACAGGA 
T CAAGGATGAGGTGGGCG CAC CGGGCATAGTGGTTGGAGTTT CTG TAGATGGAAAAGAAGT C 
TGGTC AGAAGGTTT AGGTTATGCT GATG TT GAGAAC CGTGTAC CATGTAAACCAGAGACAGT 
TATGCGAATTGCTAGCATCAGCAAAAGTCTCACCATGGTTGCTCTTGCCAAATTGTGGGAAG 
CAGGGAAA CTGG AT CT TGATAT T C CAGTACAACATTATGTT C CCGAATTC CCAGAAAAAGAA 
TATGAAGGT GAAAAGGTT TCTGT C ACAACAAGATT ACTGATTTC CCATTT AAGTGGAATT CG 
TCATTATGAAAAGGACATAAAAAAGGTGAAAGAAGAGAAAGCTTATAAAGCCTTGAAGATGA 
TG AAAGAGAATGTTGCATTTGAGCAAGAAAAAGAAG GCAAAAGT AAT GAAAAGAAT GATTTT 
ACTAAATTTAAAACAGAG CAGGAGAATGAAGC CAAATG CC GGAATT CAAAAC CTGG CAAGAA 
AAAGAATGATTTTGAAeAAGGCGAATTATATTTGAGAGAAAAGTTTGAAAATTCAATTGAAT 
CCCTAAGATTATTTAAAAATGATCCTTTGTTCTTCAAACCTGGTAGTCAGTTTTTGTATTCA 
ACTTTTGG CTATAC CCT ACTGGCAGC CATAGT AGAGAGAG CTT C AGGATGTAAATATTTGGA 
CTATATGCAGAAAATATTCCATGACTTGGATATGCTGACGACTGTGCAGGAAGAAAACGAGC 
CAGT GATTTACAATAG AG CAAGGTAAATGAAT AC CTTCTGCTGTGT CTAGCTATAT CGCATC 
T TAACACTAT TT TATT AATT AAAAG T CAAATTTT CTTTGTTTC CATT CCAAAAT CAACCTG C 
CACATTTTGGGAGCTTTTCTACATGTCTGTTTTCTCATCTGTAAAGTGAAGGAAGTAAAACA 
TGTTTATAAAGTAAAAAAA 



216/270
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FIGURE 214 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76522
xsubunit 1 of 1, 373 aa, 1 stop 
><MW: 41221, pi: 8.54, NX(S/T): 0 

MYRLLSAVTARAAAPGGLAS S CGRRGVHQRAGLP PLGHGWVGGLGLGLiGLALiGVKLAGGLRG 

AAPAQSPAAPDPEASPLAEPPQEQSLAPWSPQTPAPPCSRCFARAIESSRDLLHRIKDEVGA 

PGIWGVSVDGKEWSEGLGYADVENRVPCKPETVMRIASISKSLTMVA1AKLWEAGKLDLD 

IPVQHYVPEFPEKEYEGEKVSVTTRLLISHLSGIRHYEKDIKKVKEEKAYKALKMMKE 

EQEKEGKSNEKNDFTKFKTEQENEAKCRNSKPGKKKNDFEQGELYLREKFENSIESLRLFKN 

DPLFFKPGSQFLYSTFGYTLLAAIVERASGCKYLDYMQKIFHDIJDMLTTVQEENEPVIYNRAR 

Signal peptide: 

amino acids 1-19 

Transmembrane domain: 

amino acids 39-60 
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FIGURE 215 

GTGACACTATAGAAGAGCTATGACGTCGCATGCACGCGTACGTAAGCTCGGAATTCGGCTCG 
AGGCTGGTGGGAAGAAGCCGAG&3SGCGGCAGCCAGCGCTGGGGCAACCCGGCTGCTCCTGC 
TCTTGCTGATGGCGGTAGCAGCGCCCAGTCGAGCCCGGGGCAGCGGCTGCCGGGCCGGGACT 
GGTGCGCGAGGGGCTGGGGCGGAAGGTCGAGAGGGCGAGGCCTGTGGCACGGTGGGGCTGCT 
GCTGGAGCACTCATTTGAGATCGATGACAGTGCCAACTTCCGGAAGCGGGGCTCACTGCTCT 
GGAACCAGCAGGATGGTACCTTGTCCCTGTCACAGCGGCAGCTCAGCGAGGAGGAGCGGGGC 
CGACTCCGGGATGTGGCAGCCCTGAATGGCCTGTACCGGGTCCGGATCCCAAGGCGACCCGG 
GGCCCTGGATGGCCTGGAAGCTGGTGGCTATGTCTCCTCCTTTGTCCCTGCGTGCTCCCTGG 
TGGAGTCGCACCTGTCGGACCAGCTGACCCTGCACGTGGATGTGGCCGGCAACGTGGTGGGC 
GTGTCGGTGGTGACGCACCCCGGGGGCTGCCGGGGCCATGAGGTGGAGGACGTGGACCTGGA 
GCTGTTCAACACCTCGGTGCAGCTGCAGCCGCCCACCACAGCCCCAGGCCCTGAGACGGCGG 
CCTTCATTGAGCGCCTGGAGATGGAACAGGCCCAGAAGGCCAAGAACCCCCAGGAGCAGAAG 
TCCTTCTTCGCCAAATACTGGATGTACATCATTCCCGTCGTCCTGTTCCTCATGATGTCAGG 
AGCGCCAGACACCGGGGGCCAGGGTGGGGGTGGGGGTGGGGGTGGTGGTGGGGGTAGTGGCC 
TTTGCTGT GTGCCACCCT CCCTGTAAGT CT ATTT AAAAACAT CGACGATACATTGAAATGTG 
TGAACGTTTTGAAAAGCTACAGCTTCCAGCAGCCAAAAGCAACTGTTGTTTTGGCAAGACGG 
TCCTGATGTACAAGCTTGATTGAAATTCACTGCTCACTTGATACGTTATTCAGAAACCCAAG 
GAATGGCTGTCCCCATCCTCATGTGGCTGTGTGGAGCTCAGCTGTGTTGTGTGGCAGTTTAT 
TAAACTGTC CC CCAGAT CGACACG CAAAAAAAAA 
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FIGURE 216

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76529
xsubunit 1 of 1, 269 aa, 1 stop
><MW: 28004, pi: 5.80, NX(S/T): 1 

MAAASAGATRLLLLLL^VAAPSRARGSGCRAGTGARGAGAEGREGEACGTVGLLLEHSFEI 
DDSANFRKRGSLLWNQQDGTLSLSQRQLSEEERGRLRDVAALNGLYRVRIPRRPGALDGIjEA 
GGYVSSFVPACSLVESHLSDQLTLHVDVAGNWGVSVVTHPGGCRGHEVEDVDLELFNTSVQ 
L Qp PTTAPGPETAAF I ERLEMEQAQKAKKPQEQKSFFAKYWM Y 1 1 PWLFLMMSGAPDTGGQ 
GGGGGGGGGGGSGLCCVPPSL 



Signal peptide: 

amino acids 1-24 



Transmembrane domain: 

amino acids 226-243 
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FIGURE 217 

GGAGCGCTGCTGGAACCCGAGCCGGAGCCGGAGCCACAGCGGGGAGGGTGGCCTGGCGGCCT 
GGAGCCGGACGTGTCCGGGGCGTCCCCGCAGACCGGGGCAGCAGGTCGTCCGGGGGCCCACC 
AIGCTGGTGACTGCCTACCTTGCTTTTGTAGGCCTCCTGGCCTCCTGCCTGGGGCTGGAACT 
GTCAAGATGCCGGGCTAAACCCCCTGGAAGGGCCTGCAGCAATCCCTCCTTCCTTCGGTTTC 
AACTGGACTTCTATCAGGTCTACTTCCTGGCCCTGGCAGCTGATTGGCTTCAGGCCCCCTAC 
CTCTATAAACTCTACCAGCATTACTACTTCCTGGAAGGTCAAATTGCCATCCTCTATGTCTG 
TGG C CT TG CC T CTACAGT C CTCTTTGGC CT AGTGGC CT C CTC CCTTGTGGATTGGCTGGGT C 
GCAAGAATTCTTGTGTCCTCTTCTCCCTGACTTACTCACTATGCTGCTTAACCAAACTCTCT 
CAAGACTACTTTGTGCTGCTAGTGGGGCGAGCACTTGGTGGGCTGTCCACAGCCCTGCTCTT 
CTCAGCCTTCGAGGCCTGGTATATCCATGAGCACGTGGAACGGCATGACTTCCCTGCTGAGT 
GGATCCCAGCTACCTTTGCTCGAGCTGCCTTCTGGAACCATGTGCTGGCTGTAGTGGCAGGT 
GTGGCAGCTGAGGCTGTAGCCAGCTGGATAGGGCTGGGGCCTGTAGCGCCCTTTGTGGCTGC 
CATCCCTCTCCTGGCTCTGGCAGGGGCCTTGGCCCTTCGAAACTGGGGGGAGAACTATGACC 
GGCAGCGTGCCTTCTCAAGGACCTGTGCTGGAGGCCTGCGCTGCCTCCTGTCGGACCGCCGC 
GTG CTGCTGCTGGGCACCATACAAGCTCTATTTGAGAGTGTCATCTTCAT CTTTGTCTTCCT 
CTGGACACCTGTGCTGGACCCACACGGGGCCCCTCTGGGCATTATCTTCTCCAGCTTCATGG 
CAGCCAGCCTGCTTGGCTCTTCCCTGTACCGTATCGCCACCTCCAAGAGGTACCACCTTCAG 
CCCATGCACCTGCTGTCCCTTGCTGTGCTCATCGTCGTCTTCTCTCTCTTCATGTTGACTTT 
CTCT AC CAGC CC AGGC CAGG AGAGT C CGGTGG AGT CCTTCAT AGC CTTTCTACTT ATTGAGT 
TGGCTTGTGGATTATACTTT C C CAG C ATGAGCTTCCTACGG AGAAAGGTG ATCC CTGAGACA 
GAGCAGGCTGGTGTACTCAACTGGTTCCGGGTACCTCTGCACTCACTGGCTTGCCTAGGGCT 
CCTTGTCCTCCATGACAGTGATCGAAAAACAGGCACTCGGAATATGTTCAGCATTTGCTCTG 
CTGTCATGGTGATGGCTCTGCTGGCAGTGGTGGGACTCTTCACCGTGGTAAGGCATGATGCT 
GAGCTGCGGGTACCTTCACCTACTGAGGAGCCCrATGCCCCrGAGCTGTAACCCCACTCCAG 
GACAAGATAG CTGGGACAGACTCTTGAATT CCAGCTATC CGG GATTGTA C AGAT CT CT CTGT 
GACTGACTTTGTGACTGTCCTGTGGTTTCTCCTGCCATTGCTTTGTGTTTGGGAGGACATGA 
TGGGGGTGATGGACTGGAAAGAAGGTGC CAAAAGTT CCCT CTGTGTTACTCCCATTTAGAAA 
ATAAACACTTTTAAATGATCAAAAAAAAAAAA 
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FIGURE 218 

MLVTAYWVGLIASCLGLELSRCRAKPFGRACSNPSFLRFQLDFYQVYFIALAADWLQAPY 
LYKLYQHYYFLEGQ IAILYVCGLASTVLFGLVASSLVDWLGRKNSCVLFSLTYSLCCLTKLS 
QDYFVLLVGRALGGLSTALLFSAFEAWYIHEHVERHDFPAEWIPATFARAAFWNHVLAVVAG 
VAAEAVASWI GLGPVAPFVAAI PLLALA^LALRNWGENYDRQRAFSRTCAGGLRCLLSDRR 
VLLLGTIQALFESVIFIFVFLWTPVLDPHGAPLGIIFSSFMAASLLGSSLYRIATSKRYHLQ 
PMHLLSLAVLIWFSLFMLTFSTSPGQESPVESFIAFLLIELACGLYFPSMSFLRRKVIPET 
EQAGVLNWFRVPLHSLACLGLLVLHDSDRKTGTRNMFS I CSAVMVMALLAWGLFTWRHDA 
ELRVPSPTEEPYAPEL 

Signal peptide: 

amino acids 1-18 

Transmembrane domain: 

amino acids 41-55, 75-94, 127-143, 191-213, 249-270, 278-299, 
314-330, 343-359, 379-394, 410-430 
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FIGURE 219 

GCGACGCGCGGCGGGGCGGCGAGAGGAAACGCGGCGCCGGGCCGGGCCCGGCCCTGGAGATG 
GTCCCCGGCGCCGCGGGCTGGTGTTGTCTCGTGCTCTGGCTCCCCGCGTGCGTCGCGGCCCA 
CGGCTT CC GTATC CATGATTATTTGTACTTT CAAGTG C TGAGTC CTGGGGACAT TCG ATACA 
TCTTCACAGCCACACCTGCCAAGGACTTTGGTGGTATCTTTCACACAAGGTATGAGCAGATT 
CACCTTGTCCCCGCTGAACCTCCAGAGGCCTGCGGGGAACTCAGCAACGGTTTCTTCATCCA 
GGACCAGATTGCTCTGGTGGAGAGGGGGGGCTGCTCCTTCCT CT CCAAGACT CGGGTGGTCC 
AGGAGC^CGGCGGGCGGGCGGTGATCATCTCTGACAACGCAGTTGACAATGACAGCTTCTAC 
GTGG AGATGAT C CAGG AC AGTAC C CAG CGC AC AGCTGACATC C C CG C C CTC TT C CTGCT CGG 
CCGAGACGGCTACATGATCCGCCGCTCTCTGGAACAGCATGGGCTGCCATGGGCCATCATTT 
CCATCCCAGTCAATGTCACCAGCATCCCCACCTTTGAGCTGCTGCAACCGCCCTGGACCTTC 
TGGTAGAAGAGTTTGTCCCACATTCCAGCCATAAGTGACTCTGAGCTGGGAAGGGGAAACCC 
AGGAATTTTGCTACTTGGAATTTGGAGATAGCATCTGGGGACAAGTGGAGCCAGGTAGAGGA 
AAAGGGTTTGGGCGTTGCTAGGCTGAAAGGGAAGCCACACCACTGGCCTTCCCTTCCCCAGG 
GCCCCCAAGGGTGTCTCATGCTACAAGAAGAGGCAAGAGACAGGCCCCAGGGCTTCTGGCTA 
GAACCCGAAACAAAAGGAGCTGAAGGCAGGTGGCCTGAGAGCCATCTGTGACCTGTCACACT 
CACCTGGCTCCAGCCTCCCCTACCCAGGGTCTCTGCACAGTGACCTTCACAGCAGTTGTTGG 
AGTGGTTTAAAGAGCTGGTGTTTGGGGACTCAATAAACCCTCACTGACTTTTTAGCAATAAA 
GCTTCTCATCAGGGTTGCAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 220 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76532 
xsubunit 1 of 1, 188 aa, 1 stop 
><MW: 21042, pi: 5.36, NX(S/T): 2 

MVPGAAGWCCLVLWLPACVAAHGFRIHDYLYFQVLSPGDIRYIFTATPAKDFGGIFHTRYEQ 
IHLVPAEPPEACGELSNGFFIQDQIALVERGGCSFLSKTRWQEHGGRAVIISDNAVDNDSF 
YVEMI QDSTQRTADI PALFLLGRDGYMIRRSLEQHGLPWAI IS I PVNVTS I PTFELLQPPWTFW 

Signal peptide: 

amino acids 1-20 



223/270
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FIGURE 221 

TCTGCCTCC^CTGCTCTGTGCTGGGATCATGGAACTTGCACTGCTGTGTGGGCTGGTGGTGA 
TGGCTGGTGTGATTCCAATCCAGGGCGGGATCCTGAACCTGAACAAGATGGTCAAGCAAGTG 
ACTGGGAAAATGCCCATCCTCTCCTACTGGCCCTACGGCTGTCACTGCGGACTAGGTGGCAG 
AGGCCAACCCAAAGATGCCACGGACTGGTGCTGCCAGACCCATGACTGCTGCTATGACCACC 
TGAAGACC CAGGGGTGCGGC AT CTACAAGGACAACAAC AAAAGCAG CATA CATTGTATGGAT 
TTATCTCAACGCTATTGTTTAATGGCTGTGTTTAATGTGATCTATCTGGAAAATGAGGACTC 
CGA ATAA AAAGC T ATTACTAWT TNAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA^ 



WO 00/12708 PCT/US99/20111

FIGURE 222 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76538 
xsubunit 1 of 1, 116 aa, 1 stop 
><MW: 12910, pi: 6.41, NX(S/T): 1 
MELALLCGLVVMAGVIPI<^GILNLNKMVKQV^ 

CCQTHDCCYDHLKTQGCGIYKDNNKSSIHCMDLSQRYCLMAVFNVIYLENEDSE 

Important features of the protein: 
Signal peptide: 
amino acids 1-17 

Transmembrane domain: 

amino acids 1-24 

N-glycosylation site. 

amino acids 86-89

N-myristoylation sites. 

amino acids 20-25, 45-50 

Phospholipase A2 histidine active site. 

amino acids 63-70 
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FIGURE 223 

CT CG CTT CTTCCTT CTGGATGGGG G CC CAGGG GG C CCAGG AGAGTATAAAGG CGAT G TGGAG 
GGTGCCCGGCACAACCAGACGCCCAGTCACAGGCGAGAGCCCTGGGATGCACCGGCCAGAGG 
CCATGCTGCTGCTGCTCACGCTTGCCCTCCTGGGGGGCCCCACCTGGGCAGGGAAGATGTAT 
GGCCCTGGAGGAGGCAAGTATTTCAGCACCACTGAAGACTACGACCATGAAATCACAGGGCT 
GCGGGTGTCTGTAGGTCTTCTCCTGGTGAAAAGTGTCCAGGTGAAACTTGGAGACTCCTGGG 
ACGTGAAACTGGGAGCCTTAGGTGGGAATACCCAGGAAGT CACC CTGCAGCCAGGCGAATAC 
ATCACAAAAGTCTTTGTCGCCTTCCAAGCTTTCCTCCGGGGTATGGTCATGTACACCAGCAA 
GGACCGCTATTTCTATTTTGGGAAGCTTGATGGCCAGATCTCCTCTGCCTACCCCAGCCAAG 
AGGGGCAGGTGCTGGTGGGCATCTATGGCCAGTATCAACTCCTTGGCATCAAGAGCATTGGC 
TTTG AATGGAATTATC C ACT AG AGGAGC CGAC C ACTG AGC CACCAGTT AATCT CACATACT C 
AGCAAACTCACCCGTGGGTCGCTAGGGTGGGGTATGGGGCCATCCGAGCTGAGGCCATCTGT 
GTGGTGGTGGCTGATGGTACTGGAGTAACTGAGTCGGGACGCTGAATCTGAATCCACCAATA 
AATAAAGCTTCTGCAGAAAA 
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FIGURE 224 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA76541 
xsubunit 1 of 1, 178 aa, 1 stop
><MW: 19600, pi: 5.89, NX(S/T): 1

MHRPEAMLLLLTLALLGGPTWAGKMYGPGGGKYFSTTEDYDHEITGLRVSVGLLLVKSVQVK 
LGDSWDVKLGALGGNTQEVTLQPGEYITKVFVAFQAFLRGMVMYTSKDRYFYFGKLDGQISS 
AY PS QEGQ VL VG I YGQ YQLLG I KS I G F E WNY PLE E PTTE P PVNL T Y SANS P VGR 

Signal peptide: 

amino acids 1-22 
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FIGURE 225 

GCTGAGCGTGTGCGCGGTACGGGGCTCTCCTGCCTTCTGGGCTCCAACGCAGCTCTGTGGCT 
GAACTGGGTGCTCATCACGGGAACTGCTGGGCTATGGAATACAGATGTGGCAGCTCAGGTAG 
CCCCAAATTGCCTGGAAGAATACATCATGTTTTT CGATAAGAAGAAATTGTAGGATCCAGTT 
TTTTTTTTAACCGCCC C CTC CCCACC C C CC AAAAAAACTGTAAAG ATGCAAAAACGTAATAT 
CCATGAAGATCCTATTACCTAGGAAGATTTTGATGTTTTGCTGCGAATGCGGTGTTGGGATT 
TATTTGTTCTTGGAGTGTTCTGCGTGGCTGGCAAAGAATAATGTTCCAAAATCGGTCCATCT 
CCCAAGGGGTCCAATTTTTCTTCCTGGGTGTCAGCGAGCCCTGACTCACTACAGTGCAGCTG 
ACAGGGGCTGTCATGCAACTGGCCCCTAAGCCAAAGCAAAAGACCTAAGGACGACCTTTGAA 
CAATACAAAGGATGGG TTTCAATGTAATTAGG CTAC TGAGCGG ATCAG CTGTAGCACTGGTT 
ATAGCCCCCACTGTCTTACTGACAATGCTTTCTTCTGCCGAACGAGGATGCCCTAAGGGCTG 
TAGGTGTG AAGG C AAAATGG TATATTGTGAAT CTCAGAAATTACAGGAGAT ACC CTCAAGT A 
TATCTGCTGGTTGCTTAGGTTTGTCCCTTCGCTATAACAGCCTTCAAAAACTTAAGTATAAT 
CAATTTAAAGGG CTCAACCAGCT CAC CTGG CT ATACCTTGAC CATAAC CATATCAG CAATAT 
TG ACGAAAATGC TTTTAATGGAATACGCAG ACTCAAAGAG CTGATT CT TAGTTCCAATAGAA 
TCTCCTATTTTCTTAACAATACCTTCAGACCTGTGACAAATTTACGGAACTTGGATCTGTCC 
TATAATCAGCTGCATTCTCTGGGATCTGAACAGTTTCGGGGCTTGCGGAAGCTGCTGAGTTT 
ACATTTACGGTCTAACTCCCTGAGAACCATCCCTGTGCGAATATTCCAAGACTGCCGCAACC 
TGGAACTTTTGGACCTGGGATATAACCGGATC CGAAGTTTAGCCAGGAATGT CTTTGCTGGC 
ATGATCAGACT CAAAGAACTT CACCTGG AG CACAAT CAATTT TC CAAG CT CAAC CTGG CCCT 
TTTTCCAAGGTTGGTCAGCCTTCAGAACCTTTACTTGCAGTGGAATAAAATCAGTGTCATAG 
GACAGACCATGT CCTGGACCTGGAGCTCCTT A CAAAGG CTTGATTTAT CAGG CAATGAGATC 
GAAGCTTTCAGTGGACCCAGTGTTTTCCAGTGTGTCCCGAATCTGCAGCGCCTCAACCTGGA 
TTCC^C^GCTCACATTTATTGGTCAAGAGATTTTGGATTCTTGGATATCCCTC^ATGACA 
TCAGTCTTGCTGGGAATATATGGGAATGCAGCAGAAATATTTGCTCCCTTGTAAACTGGCTG 
AAAAGT TT TAAAGGTCTAAGGGAGAATACAAT TATCTGTG C CAGT C CCAAAGAGCTG CAAGG 
AGTAAATGTGATCGATGCAGTGAAGAACTACAGCATCTGTGGCAAAAGTACTACAGAGAGGT 
TTGATCTGGCCAGGGCTCTCCCAAAGCCGACGTTTAAGCCCAAGCTCCCCAGGCCGAAGCAT 
GAGAGCAAACCCCCTTTGCCCCCGACGGTGGGAGCCACAGAGCCCGGCCCAGAGACCGATGC 
TGACGCCGAGCACATCTCTTTCCATAAAATCATCGCGGGCAGCGTGGCGCTTTTCCTGTCCG 
TG CT CGTCAT C CTG CT GGTT AT CTACGTGTCATGGAAGCGGTACCCTGCGAG CATGAAGCAG 
CTGCAG CAG CGCTC CCTCATGCGAAGGCACAGGAAAAAGAAAAGACAGTC C CTAAAGCAAAT 
GACT CC CAG CAC CCAGGAATTTTATGTAGATT ATAAAC CCAC CAACACGGAGAC CAG CGAGA 
TGCTGCTGAATGGGACGGGACCCTGCACCTATAACAAATCGGGCTCCAGGGAGTGTGAGGTA 
T^^CCATTGTGATAAAAAGAGCTCTTAAAAGCTGGGAAATAAGTGGTGCTTTATTGAACTC 
TGGTGACTATCAAGGGAACGCGATGCCCCCCCTCCCCTTCCCTCTCCCTCTCACTTTGGTGG 
CAAGATCCTTCCTTGTCCGTTTTAGTGCATTCATAATACTGGTCATTTTCCTCTCATACATA 
ATCAACCCATTGAAATTTAAATACCACAATCAATGTGAAGCTTGAACTCCGGTTTAATATAA 
TACCTATTGTATAAGACCCTTTACTGATTCCATTAATGTCGCATTTGTTTTAAGATAAAACT 
TCTTTCATAGGTAAAAAAAAAAA 
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FIGURE 226 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA77301 
xsubunit 1 of 1, 513 aa, 1 stop 
><MW: 58266, pi: 9.84, NX(S/T): 4

MGFWIRLLSGSAVALVIAPTVLLTMLSSAERGCPKGCRCEGKMVYCESQKLQEIPSSISAG 
CLGLSLRYNSLQKLKYNQFKGLNQLTWLYLDHNHISNIDENAFNGIRRLKELILSSNRISYF 
I^NTFRPVTNLRKLDLSYNQLHSLGSEQFRGLRKLLSLHLRSNSLRTIPVRIFQDCRNLELL 
DLGYNRIRSLARNVFAGMIRLKELHLEHNQFSKIjNLALFPRLVSLQNLYLQWNKISVIGQTM 
SWTWSSLQRLDLSGNE I EAFSG PS VFQCVPNLQRLNLDSNKLTF IGQE ILDSWISLND I SLA 
GNI WECSRNI CSLVNWLKSFKGLRENTI I CAS PKELQGVNVI DAVKNYS I CGKSTTERFDLA 
RALPKPTFKPKLPRPKHESKPPLPPTVGATEPGPETDADAEHISFHKIIAGSVALFLSVLVI 

LLVIYVSWKRYPASMKQLQQRSLMRRHRKKKRQSLKQMTPSTQEFYVDYKPTNTETSEMLLN 
GTGPCTYNKSGSRECEV 

Important features of the protein: 
Signal peptide: 

amino acids 1-33 

Transmembrane domain: 

amino acids 420-442 

N-glycosylation sites. 

amino acids 126-129, 357-360, 496-499, 504-507 

cAMP- and cGMP-dependent protein kinase phosphorylation site.

amino acids 465-468 

Tyrosine kinase phosphorylation site. 

amino acids 136-142 

N-myristoylation sites. 

amino acids 11-16, 33-38, 245-250, 332-337, 497-502, 507-512 



WO 00/12708 



PCT/US99/20111 



FIGURE 227 

AGTT CTGAGAAAGAAGGAAATAAACACAGGCACCAAAC CACTATCCTAAGTTGACTGTCCTT 
TAAAT A£GTCAAGAT C CAGACTTTT CAGTGTC AC CT CAGCGAT CT C AACG AT AGGGATCTTG 
TGTTTGCCGCTATTCCAGTTGGTGCTCTCGGACCTACCATGCGAAGAAGATGAAATGTGTGT 
AAATTATAATGACCAACACCCTAATGGCTGGTATATCTGGATCCTCCTGCTGCTGGTTTTGG 
TGGCAGCTCTTCTCTGTGGAGCTGTGGTCCTCTGCCTCCAGTGCTGGCTGAGGAGACCCCGA 
ATTGATTCTCACAGGCGCACCATGGCAGTTTTTGCTGTTGGAGACTTGGACTCTATTTATGG 
GACAGAAGCAGCTGTGAGTCCAACTGTTGGAATTCACCTTCAAACTCAAACCCCTGACCTAT 
ATCCTGTTCCTGCTCCATGTTTTGGCCCTTTAGGCTCCCCACCTCCATATGAAGAAATTGTA 
AAAACAAC CTGATTTT AG GT GTGG AT TATCAATTTAAAGT ATTAACGACATCTGT AATTCCA 
AAAC AT CAAATTTAGGAATAGTTATTTC AG TTGTTGGAAATGT C CAGAGATCT ATTCAT AT A 
GTCTGAGGAAGGACAATTCGACAAAAGAATGGATGTTGGAAAAAATTTTGGTCATGGAGATG 
TTTAAATAGT AAAGT AGC AG GCTTTT GATGTGT CACTG CTGTATCATACTTTTATG CTACAC 
AACCAAATTAATGCTTCTCCACTAGTATCCAAACAGGCAACAATTAGGTGCTGGAAGTAGTT 
TCCATCACATTTAGGACTCCACTGCAGTATACAGCACACCATTTTCTGCTTTAAACTCTTTC 
CT AG CAT GGGGT CCATAAAAATTATTATAATTTAACAATAG CC CAAG C CGAGAATCCAAC AT 
GT C C AG AAC CAG AA C CAGAAAGAT AGTA TT TG AATG AAGG TG AGG G G AGAG AGT AG GAAAAA 
GAAAAGTTTGGAGTTGAAGGGTAAAGGATAAATGAAGAGGAAAAGGAAAAGATTACAAGTCT 
CAGC AAAAACAAG AGGTTTTATGCC CCAAC CT GAAGAGGAAG AAATTG TAGAT AGAAGGTGA 
AGGAGATTGCTGAAGATATAGAGCACATATAATGCCAACACGGGGAGAAAAGAAAATTTCCC 
CTTTTACAGTAATGAATGTGGCCTCCATAGTCCATAGTGTTTCTCTGGAGCCTCAGGGCTTG 
GCATTT ATTG CAG CAT CATG CT AAGAAC CT T CGGCATAGGTATCTGTT CCCATGAGGACTG C 
AG AAGT AG CAAT GAGA CATC TT CAAG T G G CAT T TTGG CAGT GG C CAT CAG C AGGG GGA CAG A 
CAAAAACATCCATCACAGATGACATATGATCTTCAGCTGACAAATTTGTTGAACAAAACAAT 
AAACAT CAAT AG AT ATCTAAAAA 



23C/270 
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FIGURE 228 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA77303 
><subunit 1 of 1, 146 aa, 1 stop 
><MW: 16116, pI: 4.99, NX(S/T): 0 

MSRSRLFSVTSAISTIGILCLPLFQLVLSDLPCEEDEMCVNYNDQHPNGWYIWILLLLVLVA 
ALLCGAWLCLQCWLRRPRIDSHRRTMAVFAVGDLDS I YGTEAAVS PTVGIKLQTQTPDLYP 
VPAPCFGPLGSPPPYEEIVKTT 

Signal peptide: 

amino acids 1-29 

Transmembrane domain: 

amino acids 52-70 



jz3/ /2 yo 
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FIGURE 229 

GAGCGGAGTAAAAT CTCCACAAG CTGGGAACAAACCTCGT C CCAACTC C C AC CCAC CGG CGT 
TTCTCCAGCTCGATCTGGAGGCTGCTTCGCGAGTGTGGGACGCAGCTGACGCCCGCTTATTA 
GCTCTCGCTGCGTCGCCCCGGCTCAGAAGCTCCGTGGCGGCGGCGACCGTGACGAGAAGCCC 
ACGGCCAGCTCAGTTCTCTTCTACTTTGGGAGAGAGAGAAAGTCAGATGCCCCTTTTAAACT 
CCCT CTTCAAAACT C ATC TC CTGGGTGACT GAGTTAAT AGAGTGGATACAAC CTTGCTG AAG 
ATGAAGAATATACAATATTG AGGATATTTT TTTCTTT T TTTTTTCAAGTCTTGATTTGTGGC 
TTACCTCAAGTTACCATTTTTCAGTCAAGTCTGTTTGTTTGCTTCTTCAGAAATGTTTTTTA 
CAATCT CAAGAAAAAATATGT CCCAGAAATTG AGTTTACTG TTGCT T GTATTTGGACTCATT 
TGGGGATTGATGTTACTGCACTATACTTTTCAACAACCAAGACATCAAAGCAGTGTCAAGTT 
ACGTGAGCAAATACTAGACTTAAGCAAAAGATATGTTAAAGCTCTAGCAGAGGAAAATAAGA 
ACACAGTGGATGTCGAGAACGGTGCTTCTATGGCAGGATATGCGGATCTGAAAAGAACAATT 
GCTGTCCTTCTGGATGACATTTTGCAACGATTGGTGAAGCTGGAGAACAAAGTTGACTATAT 
TGTTGTGAATGG CT CAGC AGC C AACACCACCAATGGTACTAGTGGGAATTTGGTGC CAGTAA 
CC ACAAAT AAAAGAACGAAT GT CTCGGG CAGT AT CAGATAGCAGTTGAAAAT CAC C TTGTGC 
TG CT CC ATCCACTGTGGATTATATC CTATGGC AGAAAAGCTTT ATAATTG CTGG CT TAGGAC 
AG AGCAAT ACTTT A CAATAAAAGCT CTACACATTTTCAAGGAGTATG C TGGATT CATGGAAC 
TCTAATT CTGTACATAAAAATTTT AAAGTTATTT GTTTGCTTT C AGGCAAGT CTGTTCAATG 
CTGTACTATGTCCTTAAAGAGAATTTGGTAACTTGGTTGATGTGGTAAGCAGATAGGTGAGT 
TTTGTATAAATCTTTTGTGTTTGAGATCAAGCTGAAATGAAAACACTGAAAAACATGGATTC 
ATTT CT ATAACACATTTATTTAAGTATATAACACGT TTTT TGGACAAGTGAAGAATGT TTAA 
TC ATTCTGT CATTT GTTCTCAATAGATGTAACTGTTAG AC TACGG CTATTTGAAAAAATGTG 
CTTATTGTACTATATTTTGTTATTCCAATTATGAGCAGAGAAAGGAAATATAATGTTGAAAA 
TAATGTTTTGAAAT CATGAC CCAAAG AATG TATTGATTTG CAC T ATCCTT CAGAATAACTGA 
AGGTTAATTAT TGT ATAT TT TT AAAAATTACACTTATAAGAGTATAAT CTTGAAATGGGT AG 
CAGCCACTGT C CAT TAC CTAT CGT AAACATTGGG GC AATTTAATAACAG CATT AAAATAGTT 
GTAAACTCTAATCTTATACTTATTGAAGAATAAAAGATATTTTTATGATGAGAGTAACAATA 
AAGTATTCATGATTTTTCACATACATGAATGTTCATTTAAAAGTTTAATCCTTTGAGTGTCT 
ATGCTATCAGGAAAGCACATTATTTCCATATTTGGGTTAATTTTGCTTTTATTATATTGGTC 
TAGG AGGAAGGGACTTTGGAG AATGGAACT CTTGAGGACITTAGC CAGGTGTAT AT AATAAA 
GGTACTTTTGTGCTGCATTAAATTGCTTGGAAAGTGTTAACATTATATTATATAAGAGTATC 
CTTTATGAAATTTT GAATTT GT ATAACAGATGCATTAGATATTCATTTTATATAATGGCCAC 
TT AAAATAAG AACATTTAAAATATAAACTATGAAGATTGACTAT CTTTT CAGGAAAAAAG CT 
GTATATAGCACAGGGAACCCTAATCTTGGGTAATTCTAGTATAAAACAAATTATACTTTTAT 
TTAAATTTCCCTTGTAGCAAATCTAATTGCCACATGGTGCCCTATATTTCATAGTATTTATT 
CTCTATAGTAACTGCTTAAGTGCAGCTAGCTTCTAGATTTAGACTATATAGAATTTAGATAT 
TGTATTGTTCGTCATTATAATATGCTACCACATGTAGCAATAATTACAATATTTTATTAAAA 
TAAATATGTGAAATATTGTTTCATGAAAGACAGATTTCCAAATCTCTCTTCTCTTCTCTGTA 
CTGTCTACCTTTATGTGAAGAAATTAATTATATGCCATTGCCAGGT 
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FIGURE 230 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA77648 

><subunit 1 of 1, 140 aa, 1 stop 
><MW: 15668, pi: 10.14, NX(S/T): 5 

MFFTI SRKNMSQKLSLLLLVFGL I WGLMLLHYTFQQ PRHQSSVKLREQ ILDLSKRYVKALAE 
ENKNT VD VEN GAS M AG YAD L KRT I AVLL DD I LQRLVKLENKVDYI WNGSAANTTNGTSGNL 
VPVTTNKRTNVSGS IR 

Important features of the protein: 
Signal peptide: 

amino acids 1-26 



A33/27* 
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FIGURE 231 



CGCGGCCGGGCCGCCGGGGTGAGCGTGCCGAGGCGGCTGTGGCGCAGGCTTCCAGCCCCCAC 
CATGC C G TG G CC CCTGCTGCTGCTG CTGG C CGTG AGTGGGG C C C AGAC AACC CGGC CATG CT 
TCCCCGGGTGCCAATGCGAGGTGGAGACCTTCGGCCTTTTCGACAGCTTCAGCCTGACTCGG 
GTGGATTGTAGCGGCCTGGGCCCCCACATCATGCCGGTGCCCATCCCTCTGGACACAGCCCA 
CTTGGACCTGTCCTCCAACCGGCTGGAGATGGTGAATGAGTCGGTGTTGGCGGGGCCGGGCT 
ACACGACGTTGGCTGGCCTGGATCTCAGCCACAACCTGCTCACCAGCATCTCACCCACTGCC 
TTCTCCCGCCTTCGCTACCTGGAGTCGCTTGACCTCAGCCACAATGGCCTGACAGCCCTGCC 
AGCCGAGAGCTTCACCAGCTCACCCCTGAGCGACGTGAACCTTAGCCACAACCAGCTCCGGG 
AGGTCTCAGTGTCTGCCTTCACGACGCACAGTCAGGGCCGGGCACTACACGTGGACCTCTCC 
CACAACCTCATTCACCGCCTCGTGCCCCACCCCACGAGGGCCGGCCTGCCTGCGCCCACCAT 
TCAGAGCCTGAACCTGGCCTGGAACCGGCTCCATGCCGTGCCCAACCTCCGAGACTTGCCCC 
TGCGCTACCTGAGCCTGGATGGGAACCCTCTAGCTCTCATTGGTCCGGGTGCCTTCGCGGGG 
CTGGGAGGCCTTACACACCTGTCTCTGGCCAGCCTGCAGAGGCTCCCTGAGCTGGCGCCCAG 
TGGCTTCCGTGAGCTACCGGGCCTGCAGGTCCTGGACCTGTCGGGCAACCCCAAGCTTAACT 
GGGCAGGAGCTGAGGTGTTTTCAGGCCTGAGCTCCCTGCAGGAGCTGGACCTTTCGGGCACC 
AACCTGGTGCCCCTGCCTGAGGCGCTGCTCCTCCACCTCCCGGCACTGCAGAGCGTCAGCGT 
GG GC CAGGATGTGCGGTGC CGGCGC CT GGTGCGG GAGGGCAC CTAC C C CCGGAGGC CTGGCT 
CCAGCCCCAAGGTGCCCCTGCACTGCGTAGACACCCGGGAATCTGCTGCCAGGGGCCCCACC 
ATCTTGTG^CAAATGGTGTGGCCCAGGGCCACATAACAGACTGCTGTCCTGGGCTGCCTCAG 
GTCCCGAGTAACTTATGTTCAATGTGCCAACACCAGTGGGGAGCCCGCAGGCCTATGTGGCA 
GCGTCACCACAGGAGTTGTGGGCCTAGGAGAGGCTTTGGACCTGGGAGCCACACCTAGGAGC 
AAAGTCTCACCCCTTTGTCTACGTTGCTTCCCCAAACCATGAGCAGAGGGACTTCGATGCCA 
AACCAGACTCGGGTCCCCTCCTGCTTCCCTTCCCCACTTATCCCCCAAGTGCCTTCCCTCAT 
GCCTGGGCCGGCCTGACCCGCAATGGGCAGAGGGTGGGTGGGACCCCCTGCTGCAGGGCAGA 
GTTCAGGTCCACTGGGCTGAGTGTCCCCTTGGGCCCATGGCCCAGTCACTCAGGGGCGAGTT 
TCTTTTCTAACATAGCCCTTTCTTTGCCATGAGGCCATGAGGCCCGCTTCATCCTTTTCTAT 
TTCCCTAGAACCTTAATGGTAGAAGGAATTGCAAAGAATCAAGTCCACCCTTCTCATGTGAC 
AGATGGGGAAACTGAGGCCTTGAGAAGGAAAAAGGCTAATCTAAGTTCCTGCGGGCAGTGGC 
ATGACTGGAGCACAGCCTCCTGCCTCCCAGCCCGGACCCAATGCACTTTCTTGTCTCCTCTA 
ATAAGCCCCACCCTCCCCGCCTGGGCTCCCCTTGCTGCCCTTGCCTGTTCCCCATTAGCACA 
GGAGTAGC AG CAGCAGGA CAGGCAAGAGCCTCACAAGTGGGACTC TGGG C CT CTGACCAGCT 
GTGCGGCATGGGCTAAGTCACTCTGCCCTTCGGAGCCTCTGGAAGCTTAGGGCACATTGGTT 
CCAGCCTAGCCAGTTTCTCACCCTGGGTTGGGGTCCCCCAGCATCCAGACTGGAAACCTACC 
CATT TT CC C CTGAG CAT CCTCTAGATG CTGC C C CAAGGAGTTGCTG CAGTTCTG GAGC CTCA 
TCTGGCTGGGATCTCCAAGGGGCCTCCTGGATTCAGTCCCCACTGGCCCTGAGCACGACAGC 
CCTT CTTACCCTCCCAGGAATGCCGTGAAAGGAGACAAGGTCTGCC CGACCCATGTCTATG C 
TCTACCCCCAGGGCAGCATCTCAGCTTCCGAACCCTGGGCTGTTTCCTTAGTCTTCATTTTA 
TAAAAGTTGTTGCCTTTTTAACGGAGTGTCACTTTCAACCGGCCTCCCCTACCCCTGCTGGC 
CGGGGATGGAGACATGTCATTTGTAAAAGCAGAAAAAGGTTGCATTTGTTCACTTTTGTAAT 
ATTGTCCTGGGCCTGTGTTGGGGTGTTGGGGGAAGCTGGGCATCAGTGGCCACATGGGCATC 
AGGGGCTGG C CC CACAGAGAC CCC ACAGGG CAGTG AG C T CTGTCTT C C CCCAC CTGC CT AGC 
CCAT CATCTATCTAAC CGGT C CTTGATTTAAT AAACAC TAT AAAAGGTTTAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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FIGURE 232 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA77652 
><subunit 1 of 1, 353 aa, 1 stop 
><MW: 37847, pi: 6.80, NX(S/T): 2 

MPWPLLLLLAVSGAQTTRPCFPGCQCEVETFGLFDSFSLTRVDCSGLGPHIMPVPIPLDTAH 
LDLSSNRLEMVNESVLAGPGYTTLAGLDLSHNLLTSISPTAFSRLRYLESLDLSHNGLTALP 
AESFTSSPLSDVNLSHNQLREVSVSAFTTHSQGRALHVDLSHNLIHRLVPHPTRAGLPAPTI 
QSLNLAWNRLHAVPNLRDLPLRYLSLDGNPLAVIGPGAFAGLGGLTHLSLASLQRLPEIiAPS 
GFRELPGLQVLDLSGNPKLNWAGAEVFSGLSSLQELDLSGTNLVPLPEALLLHLPALQSVSV 
GQDVRCRRLVREGTYPRRPGSSPKVPLHCVDTRESAARGPTIL 

Signal peptide: 

amino acids 1-16 

Transmembrane domains: 

amino acids 215-232, 287-304 
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FIGURE 233 

GATGGCGCAGCCACAGCTTCTGTGAGATTCGATTTCTCCCCAGTTCCCCTGTGGGTCTGAGG 
GGAC CAGAAGGGTGAGCTACGTTGGCTTT C TGGAAGGGG AGG CTATATGCGT C AATT CC C C A 
AAACAAGTTTTGACATTTCCCCTGAAATGTCATTCTCTATCTATTCACTGCAAGTGCCTGCT 
GTTCCAGGC CTTACCTG CTGGG CACT AACGGC GG AG CC AGGATGGGGACAGAATAAAGGAG C 
CACGACCTGTGCC^CCAACTCGCACTCAGACTCTGAACTCAGACCTGAAATCTTCTCTTCAC 

gggaggcttggcagtttttcttactcctgtggtctccagatttcaggcctaagatgaaagcc 
tctagtcttgccttcagccttctctctgctgcgttttatctcctatggactccttccactgg 
actgaagacact caatttgggaagctgtgtgatcgc cacaaaccttcaggaaatacgaaatg 
gatttt ctgagatacgggg c agtgtg c aag c caaagatggaaacattgacatcagaat ctta 
aggaggactgagtctttgcaagacacaaagcctgcgaatcgatgctgcctcctgcgccattt 
g c t aagactc tatctg g acagggt atttaaaaact ac cagac cc ct g ac c att atact ct cc 
ggaagatcagcagcctcgccaattcctttcttaccatcaagaaggacctccggctctctcat 
gc ccacatgacatgccattgtggggaggaag caatgaag aaat acag c cagatt ctgagt c a 
ctttgaaaagctggaacctcaggcagcagttgtgaaggctttgggggaactagacattcttc 
tg caatggatggaggagacagaataggagg aaagtg atgc tg ctgctaagaatattcgaggt 
caagagctccagtcit:caatacctgcagaggaggcatgaccccaaaccaccatctctttact 
gtactagtcttgtgctggtcacagtgtatcttatttatgcattacttgcttccttgcatgat 
tgtctttatgcatccccaatcttaattgagaccatacttgtataagatttttgtaatatctt 
t ctgctattggatatattt attag ttaatatatttatttatt ttttg ctattt aatgtattt 
attttttt acttgg ac atgaaact tt aaaaaaatt c ac agatt at atttataacctgac tag 
ag c aggtgatgtat ttttatac ag taaaaaaaaaaaaccttgtaaattctagaagagtgg ct 
aggggggttattcatttgtattcaactaaggacatatttact catgctgatg ctctgtgaga 
tatttgaaattgaaccaatgactacttaggatgggttgtggaataagttttgatgtggaatt 
gcacatctaccttacaattactgaccatccccagtagactccccagtcccataattgtgtat 
cttccagccaggaatcctacacggccagcatgtatttctacaaataaagttttctttgcata 

CCAAAAAAAAAAAAAAAAAAA 



A3S/2.7d 
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FIGURE 234 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA83500 
><subunit 1 of 1, 261 aa, 1 stop 
><MW: 29667, pi: 8.76, NX(S/T): 0 

MRQFPKTSFDISPEMSFStYSLQVPAVPGLTCWALTAEPGWGQNKGATTCATNSHSDSELRP 
EIFSSREAWQFFLLLWSPDFRPKMKASSl^FSLLSAAFYLLWTPSTGLKTLNMSCVIATNL 
QE IRNGFS E I RGSVQAKDGNID IR ILRRTES LQDTKPANRCCLLRHLLRLYLDRVFKNYQTP 
DHYTLRKISSLANSFLTIKKDLRLSHAHMTCHCGEEAMKKYSQILSHFEKLEPQAAVVKALG 
ELD I LLQWMEETE 

Important features of the protein: 
Signal peptide: 

amino acids 1-42 

cAMP- and cGMP- dependent protein kinase phosphorylation sites. 

amino acids 192-195, 225-228 

N-myristoylation sites . 

amino acids 42-47, 46-51, 136-141 
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FIGURE 235 

CCGTTAT.CGTCTTGCGCTACTGCTGAATGTCCGTCCCGGAGGAGGAGGAGAGGCTTTTGCCG 
CTGACCCAGAGATGGCCCCGAGCGAGCAAATTCCTACTGTCCGGCTGCGCGGCTACCGTGGC 
CGAGCTAGCAACCTTTCCCCTGGATCTCACAAAAACTCGACTCCAAATGCAAGGAGAAGCAG 
CT CTTG CT CGGT TGGGAGACGG TG CAAGAGAATC TG C C C CCT ATAGGGGAAT GGTG CG CACA 
G CC CTAGGGAT CATTG AAGAGGAAGG CTTT CTAAAGCTTTGG CAAGGAGT GACAC C CGCCAT 
TTACAGACACGT AGTG T ATT CTGG AGGTCG AATG GT CAC ATATGAA GAT CTCCG AGAGGTTG 
TGTTTGGCAAAAGTGAAGATGAGCATTATCCCCTTTGGAAATCAGTCATTGGAGGGATGATG 
GCTGGTGTTATTGGCCAGTTTTTAGCCAATCCAACTGACCTAGTGAAGGTTCAGATGCAAAT 
GGAAGGAAAAAGGAAACTGGAAGGAAAACCATTGCGATTTCGTGGTGTACATCATGCATTTG 
CAAAAATCTTAG CTGAAGGAGG AAT ACGAGGGCTTTGGGCAGG CTGGGTACCCAATATACAA 
AGAG C AG C ACTGGTGAAT ATGGG AG ATTTAAC CACTTATGATAC AG TGAAACACT ACT TGGT 
ATTG AATACACC ACTTGAGGACAAT ATCAT GACTCACGGTTTAT CAAGTTT ATG TT CTGGAC 
TGGT AGCTTCTATTCTGGGAA CAC CAG CCG ATGT CAT C AAAAGCAG AATAATGAAT CAAC CA 
CG AGATAAAC AAGG AAGGGGACTTTTGT AT AAAT CAT CG ACTGACTGCTT GATT C AGG CTGT 
TCAAGGTGAAGGATTCATGAGTCTATATAAAGGCTT TTTACCAT CTTGGCTG AGAATGACCC 

CTTGGTCAATGGTGTTCTGGCTTACTTATGAAAAAATCAGAGAGATGAGTGGAGTCAGTCCA 
TTTTAA 
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FIGURE 236 

></usr/seqdb2/ast/DNA/Dnaseqs.min/ss.DNA77568 ' 
><subunit 1 of 1, 323 aa, 1 stop 
><MW: 36064, pi: 9.33, NX(S/T): 1 

MSVPEEEERLLPLTQRWPRASKFLLSGCAATVAELATFPLDLTKTRLQM 
RESAPYRGMVRTALGI IEEEGFLKLWQGVTPAIYRHWYSGGRMVTYEHLREVVFGKSEDEH 
YPLWKSVIGGMMAGVIGQFLANPTDLVK^QMQMEGK^ 

RGLWAGOTPNIQRAALVNMGDLTTYDTVKHYLVLNTPLEDNIMTHGLSSLCSGLVASILGTP 
ADVIKSRIMNQPRDKQGRGLLYKSSTDCLIQAVQGEGFMSLYKGFLPSWLRMTPWSMVFWLT 
YEKIREMSGVSPF 

Transmembrane domains : 

amino acids 25-38, 130-147, 233-248 
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FIGURE 237 

CGGACGCGTGGGCGCGGGACGCCGGCAGGGTTGTGGCGCAGCAGTCTCCTTCCTGCGCGCGC 
GCCTGAAGTCGGCGTGGGCGTTTGAGGAAGCTGGGATACAGCATTTAATGAAAAATTTATGC 
TTAAGAAGTAAAAATGGCAGGCTT CCTAGATAATTTT CGTTG GCCAGAATGTGAATGT ATTG 
ACTGGAGTGAGAGAAGAAATGCTGTGG CATCTGT TGT CGC AGGTATATTG TTTTTT AC AGGC 
TGGTGGATAATGATTGATGCAGCTGTGGTGTATCCTAAGCCAGAACAGTTGAACCATGCCTT 
TCACACATGTGGTGTATTTTCCACATTGGCTTTCTTCATGATAAATGCTGTATCCAATGCTC 
AGGTGAGAGGTG AT AG CT ATGAAAG C G G CT GTTT AGGAAGAACAGGTGCT CGAGTTTGGCTT 
TTCATTGGTTTCATGTTGATGTTTGGGTCACTTATTGCTTCCATGTGGATTCTTTTTGGTGC 
ATATGTTACCCAAAATACTGATGTTTATCCGGGACTAGCTGTGTTTTTTCAAAATGCACTTA 
TATTTT TT AG CACT CTGATC T ACAAATT TGGAAG AAC CGAAGAG CTATGG AC C£GAGAT C A C 
TTCTTAAGTCACATTTTCCTTTTGTTATATTCTGTTTGTAGATAGGTTTTTTATCTCTCAGT 
ACACATTGCCAAATGGAGTAGATTGTACATTAAATGTTTTGTTTCTTTACATTTTTATGTTC 
TGAGTTTTGAAATAGTTTTATGAAATTTCTTTATTTTTCATTGCATAGACTGTTAATATGTA 
TATAATAC AAGACTATATGAATTGGATAATGAGTAT CAGTTTTTTATTC CTGAGATTT AGAA 
CTTGATCTACTCCCTGAGCCAGGGTTACATCATCTTGTCATTTTAGAAGTAACCACTCTTGT 
CTCTCTGGCTGGGCACGGTGGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGCGGG 
CCGATTGCTTGAGGTCAAGTGTTTGAGACCAGCCTGGCCAACATGGCGAAACCCCATCTACT 
AAAAATACAAAAATTAGC CAGGCATGGTGGTGGGTG CCTGTAAT CCCAG C TACCTGGGAGG C 
TGAGGCAGGAGAATCGCTTGAACCCGGGGGGCAGAGGTTGCAGTGAGCTGAGTTTGCGCCAC 
TGCACTCTAGCCTGGGGGAGAAAGTGAAACTCCCTCTCAAAAAAAAGACCACTCTCAGTATC 
TCTGATTT CTGAAGATGTACAAAAAAAT AT AG CTT CAT ATATCTGGAATGAG CACTGAGC CA 
TAAAAGGTTTT CAG CAAG TTGT AACTTATTTTGGCCT AAAAATGAGGTTTTTTTGGTAAAGA 
AAAAAT AT TTGTTCTTATGTATTGAAG AAGTGT ACTTTTATATAAT GATTTTTTAAATG C C C 
AAAGGACTAGTTTGAAAGCTT CTTTTAAAAAG AATTC CT CTAATATGACTTTATGTGAGAA 
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FIGURE 238 

MAGFLDNFRWPECECIDWSERRNAVASWAGILFFTGWWIMIDAAWYPKPEQLNHAFHTCG 
VFSTLAFFMINAVSNAQTOGDSYESGCLGRTGARVV^FIGFMLMFGSLIAS^ILFGAYVTQ 
NTDVYPGLAVFFQNALIFFSTLIYKFGRTEELWT 

Important features: 
Signal peptide: 
amino acids 1-44 

Transmembrane domains: 

amino acids 23-42 (type II), 60-80, 97-117, 128-148 
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FIGURE 239 

GTTGATGGCAAACTTCCTCAAAGGAGGGGCAGAGCCTGCG CAGGGCAGGAGC AGCTGGCC CA 
CTGGCGGCCCGCAACACTCCGTCTCACCCTCTGGGCCCACTGCATCTAGAGGAGGGCCGTCT 
GTGAGGCCACTACCCCTCCAGCAACTGGGAGGTGGGACTGTCAGAAGCTGGCCCAGGGTGGT 
GGTCAGCTGGGTCAGGGACCTACGGCACCTGCTGGACCACCTCGCCTTCTCCATCGAAGCAG 
GGAAGTGGGAGCCTCGAGCCCTCGGGTGGAAGCTGACCCCAAGCCACCCTTCACCTGGACAG 
GATGAGAGTGTCAGGTGTGCTTCGCCTCCTGGCCCTCATCTTTGCCATAGTCACGACATGGA 
TGTTTATT CGAAG C TACATG AGCTTCAG CATGAAAACC AT CC GTCTGC CACGCTGGCTGGCA 
GCCTCGCCCACCAAGGAGATCCAGGTTAAAAAGTACAAGTGTGGCCTCATCAAGCCCTGCCC 
AGCCAACTACTTTGCGTTTAAAATCTGCAGTGGGGCCGCCAACGTCGTGGGCCCTACTATGT 
GCTTTGAAGACCGCATGATCATGAGTCCTGTGAAAAACAATGTGGGCAGAGGCCTAAACATC 
GCCCTGGTGAATGGAACCACGGGAGCTGTGCTGGGACAGAAGGCATTTGACATGTACTCTGG 
AGATGTTATG CAC CT AGTGAAATT CCTTAAAGAAATTC CG GGGGGT GC AC TGGT GCTGGTGG 
CCTCCTACGACGATC CAGGGACCAAAATGAACGATGAAAGCAGGAAACTCTT CTCTGACTTG 
GGGAGTTCCTACGCAAAACAACTGGGCTTCCGGGACAGCTGGGTCTTCATAGGAGCCAAAGA 
CCTCAGGGGTAAAAGCCCCTTTGAGCAGTTCTTAAAGAACAGCCCAGACACAAACAAATACG 
AGGGATGGCCAGAGCTGCTGGAGATGGAGGGCTGCATGCCCCCGAAGCCATTTTAGGGTGGC 
TGTGGCTCTTCCTCAGCCAGGGGCCTGAAGAAGCTCCTGCCTGACTTAGGAGTCAGAGCCCG 
GCAGGGGCTGAGGAGGAGGAGCAGGGGGTGCTGCGTGGAAGGTGCTGCAGGTCCTTGCACGC 
TGTGTCGCGCCTCTCCTCCTCGGAAACAGAACCCTCCCACAGCACATCCTACCCGGAAGACC 
AGCCTCAGAGGGTCCTTCTGGAACCAGCTGTCTGTGGAGAGAATGGGGTGCTTTCGTCAGGG 
ACTG CTGACGGC TGGT C CT G AGG AAGGACAAAC TGC CCAGACTTGAGC C CAATT AAATTTTA 
TTTTTGCTGGTTTTGAAAAAAAAAAAAAAAAAAAA 
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FIGURE 240 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA59814 
><subunit 1 of 1, 224 aa, 1 stop 
><MW: 24963, pI: 9.64, NX(S/T): 1 

mrvsgvi^llalifaivtt™firsymsfsmktirlprwlaasptkeiqvkkykcglikpcp 
anyf afki cs gaanwgptmcfedrmims p vknnvgrglni alvngttgavlgqkafdmysg 
dvmhlvkflke i pggalvlvas yddpgtkmndesrklfsdlgssyakqlgfrdswvfigakd 
lrgks p feqflkns pdtnkyegwpellemegcmp pkpf 

Important features: 
Signal peptide: 

amino acids 1-15 

ATP/GTP-binding site motif A (P-loop). 

amino acids 184-191 

N-glycosylation site. 

amino acids 107-110 
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FIGURE 241 

GAGA CT GCAGAGGGAGAT AAAG AGAG AGGGCAAAGAGG CAGCAAGAGATTT GTCCTGGG GAT 
C CAGAAAC CCATGAT A CC CT ACTGAAC AC C GAAT C C CCTG G AAG CCC AC AG AGACAGAGACA 
GCAAGAG AAGC AGAGATAAATACACTCACG C CAGGAGCTCGCT CG CT CT CT C TCTCT CT CT C 
TCACTCCTCCCTCCCTCTCTCTCTGCCTGTCCTAGTCCTCTAGTCCTCAAATTCCCAGTCCC 
CTGCACCCCTTCCTGGGACACTA2STTGTTCTCCGCCCTCCTGCTGGAGGTGATTTGGATCC 
TGGCTGCAGATGGGGGTCAACACTGGACGTATGAGGGCCCACATGGTCAGGACCATTGGCCA 
GCCTCTTACCCTG AGTGTGGAAACAATGC CCAGTCGCC CAT CGATATTCAGACAGACAGTGT 
GACATTTGACCCTGATTTGCCTGCTCTGCAGCCCCACGGATATGACCAGCCTGGCACCGAGC 
CTTTGGACCTGCACAACAATGGCCACACAGTGCAACTCTCTCTGCCCTCTACCCTGTATCTG 
GGTGGACTTCCCCGAAAATATGTAGCTGCCCAGCTCCACCTGCACTGGGGTCAGAAAGGATC 
CCCAGGGGGGTCAGAACACCAGATCAACAGTGAAGCCACATTTGCAGAGCTCCAGATTGTAC 
ATTATGACTCTGATTCCTATGACAGCTTGAGTGAGGCTGCTGAGAGGCCTCAGGGCCTGGCT 
GTCCTGGG CATCCTAATTGAGGTGGGTGAGACTAAGAATATAGCTTATGAACACATTCTGAG 
TCACTTGCATGAAGTCAGGCATAAAGATCAGAAGACCTCAGTGCCTCCCTTCAACCTAAGAG 
AGCTGCTCCCCAAACAGCTGGGGCAGTACTTCCGCTACAATGGCTCGCTCACAACTCCCCCT 
TGCTACCAGAGTGTGCTCTGGACAGTTTTTTATAGAAGGTCCCAGATTTCAATGGAACAGCT 
GGAAAAGCTTCAGGGGACATTGTTCTCCACAGAAGAGGAGCCCTCTAAGCTTCTGGTACAGA 
ACTACCGAGCCCTTCAGCCTCTCAATCAGCGCATGGTCTTTGCTTCTTTCATCCAAGCAGGA 
TCCTCGTATACCACAGGTGAAATGCTGAGTCTAGGTGTAGGAATCTTGGTTGGCTGTCTCTG 
CCTT CTC CTGGCTGTTTATTTCATTGCTAGAAAGATTCGGAAGAAGAGGCTGGAAAAC CGAA 
AGAGTG TGG T CTT CA C CTCAGCACAAGCCACGACTGAGGCATAAAT TC CTT C TC AG AT AC CA 
TGGATGTGGATGACTTCCCTTCATGCCTATCAGGAAGCCTCTAAAATGGGGTGTAGGATCTG 
GCCAGAAACACTGTAGGAGTAGTAAGCAGATGTCCTCCTTCCCCTGGACATCTCTTAGAGAG 
GAATGGACCCAGGCTGTCATTCCAGGAAGAACTGCAGAGCCTTCAGCCTCTCCAAACATGTA 
GGAGGAAATGAGGAAATCGCTGTGTTGTTAATGCAGAGANCAAACTCTGTTTAGTTGCAGGG 
GAAGTTTGGGATATACCCCAAAGTCCTCTACCCCCTCACTTTTATGGCCCTTTCCCTAGATA 
TACTGCGGGATCT CTC CTTAGGAT AAAGAGTTGCTGTTGAAGTTGTATATTTTTGATCAATA 
TATTTGGAAATTAAAGTTTCTGACTTT 
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FIGURE 242 

></usr/seqdb2/sst/DNA/Dnaseqs.min/ss.DNA62812 
><subunit 1 of 1, 337 aa, 1 stop 
><MW: 37668, pI: 6.27, NX(S/T): 1 

MLFSAIiLEVIWILAADGGQHWTYEGPHGQDHWPASYPECGNNAQSPIDIQTDSVTFDPDLP 
ALQPHGYDQPGTEPLDLHNNGHTVQLSLPSTLYLGGLPRKYVAAQLHLHWGQKGSPGGSEHQ 
INSEATFAELHIVKYDSDSYDSLSEAAERPQGLAVLGILIEVGETKNIAYEHILSHLHEVRH 
KDQKTSVPP FNLRELLPKQLGQYFR YNGS LTTPPCYQS VLWTVFYRRSQ I SMEQLEKLQGTL 
FSTEEEPSKLLVQNYRALQPLNQRMVFASFIQAGSSYTTGEMLSLGVGILVGCLCLLLAVYF 
I ARKI RKKRLENRKS WFTS AQATTEA 

Important features of the protein: 
Signal peptide: 

amino acids 1-15 

Transmembrane domain : 

amino acids 291-310 

N-glycosylation site. 

amino acids 213-216 

Eukaryotic-type carbonic anhydrases proteins 

amino acids 197-245, 104-140, 22-69 
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FIGURE 243 

AATTTTTCACCAGAGTAAACTTGAGAAACCAACTGGACCTTGAGTATTGTACATTTTGCCTC 
GTGGACCCAAAGGTAGCAATCTGAAACATSAGGAGTACGATTCTACTGTTTTGTCTTCTAGG 
ATCAACTCGGTCATTACCACAGCTCAAACCTGCTTTGGGACTCCCTCCCACAAAACTGGCTC 
CGGATCAGGGAACACTACCAAACCAACAGCAGTCAAATCAGGTCTTTCCTTCTTTAAGTCTG 
AT ACCATTAACACAGATG CT CACACTGGGG CC AG AT CTG CAT CT GTTAAATCCTGCTG C AGG 
AATGACACCTGGTACCCAGACCCACCCATTGACCCTGGGAGGGTTGAATGTACAACAGCAAC 
TGCACCCACATGTGTTACCAATTTTTGTCACACAACTTGGAGCCCAGGGCACTATCCTAAGC 
TC AGAGGAATTGCCACAAAT CTTCACGAGC CT CATCATCCATTCCTTGTTCCCGGGAGGCAT 
CCTGCCCACCAGTCAGGCAGGGGCTAATCCAGATGTCCAGGATGGAAGCCTTCCAGCAGGAG 
GAGCAGGTGTAAATCCTGCCACCCAGGGAACCCCAGCAGGCCGCCTCCCAACTCCCAGTGGC 
ACAGATGACGACTTTGCAGTGACCACCCCTGCAGGCATCCAAAGGAGCACACATGCCATCGA 
GGAAGC CACCACAG AATCAG CAAATGGAATTCAGTAAGCTGTTTCAAATTTTTT CAACTAAG 
CTGC CT CGAATTTGGTGATACATGTGAATCTTTATCATTGATTATATTATGGAATAGATTGA 
GA CACATTGG ATAGT CTTAGAAGAAATTAATTCTTAATTT AC CT GAAAATATTCTTGAAATT 
TCAGAAAATATGTTCTATGTAGAGAATCCCAACTTTTAAAAACAATAATTCAATGGATAAAT 
CTGTCTTTGAAATATAAC ATTAT G CTG C C TGGATGATATG CATATT AAAACATATTTGGAAA 

ACTGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
AAAAAAAAAAAAAAAAAAA 
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FIGURE 244 

MRSTILLFCLLGSTRSLPQLKPALGLPPTKLAPDQGTLPNQQQSNQVFPSLSLIPLTQM 
LTI^PDLHLLNPAAGMTPGTQTHPLTLGGIWQQQLHPHVLPIFVTQLGAQGTILSSEE 
LPQIFTSLIIHSLFPGGILPTSQAGANPDVQDGSLPAGGAGVNPATQGTPAGRLPTPSG 
TDDDFAVTTPAGIQRSTHAIEEATTESANGIQ 

Signal peptide: 

amino acids 1-16 
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FIGURE 245 



GGAGAGAGGCGCGCGGGTGAAAGGCGCATTGATGCAGCCTGCGGCGGCCTCGGAGCGCGGCG 
GAGCCAGACGCTGACCACGTTCCTCTCCTCGGTCTCCTCCGCCTCCAGCTCCGCGCTGCCCG 
GCAGCCGGGAGCCATGCGACCCCAGGGCCCCGCCGCCTCCCCGCAGCGGCTCCGCGGCCTCC 
TGCTGCTCCTGCTGCTGCAGCTGCCCGCGCCGTCGAGCGCCTCTGAGATCCCCAAGGGGAAG 
CAAAAGGCGCAGCTCCGGCAGAGGGAGGTGGTGGACCTGTATAATGGAATGTGCTTACAAGG 
GCCAGCAGGAGTGCCTGGTCGAGACGGGAGCCCTGGGGCCAATGTTATTCCGGGTACACCTG 
GGATCCCAGGTCGGGATGGATTCAAAGGAGAAAAGGGGGAATGTCTGAGGGAAAGCTTTGAG 
GAGTCCTGGACACCCAACTACAAGCAGTGTTCATGGAGTTCATTGAATTATGGCATAGATCT 
TGGGAAAATTGCGGAGTGTACATTTACAAAGATGCGTTCAAATAGTGCTCTAAGAGTTTTGT 
TCAGTGGCTCACTTCGGCTAAAATGCAGAAATGCATGCTGTCAGCGTTGGTATTTCACATTC 
AATGGAGCTGAATGTTCAGGACCTCTTCCCATTGAAGCTATAATTTATTTGGACCAAGGAAG 
CCCTGAAATGAATTCAACAATTAATATTCATCGCACTTCTTCTGTGGAAGGACTTTGTGAAG 
GAATTGGTGCTGGATTAGTGGATGTTGCTATCTGGGTTGGCACTTGTTCAGATTACCCAAAA 
GGAGATGCTTCTACTGGATGGAATTCAGTTTCTCGCATCATTATTGAAGAACTACCAAAA^ 
^TGCTTTAATTTTCATTTGCTACCTCTTTTTTTATTATGCCTTGGAATGGTTCACTTAAAT 
GACATT TTAAAT AAGTTT ATGTATACAT CTG AATGAAAAG CAAAGCTAAATATGTTT AGA.GA 
CCAAAGTGTGATTTCACACTGTTTTTAAATCTAGCATTATTCATTTTGCTTCAATCAAAAGT 
GGTTTCAATATTTTTTTTAGTTGGTTAGAATACTTTCTTCATAGTCACATTCTCTCAACCTA 



TAAAAGCTACCAAT CTTT GT ACAATTTGTAAATG TTAAGAATTTTTTTT ATATCTGTTAAAT 
AAAAATT ATTT C CAAC A 
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FIGURE 246 

></usr/seqdb2/sst/DNA/Dnaseqs . min/ss . DNA76393 
><subunit 1 of 1, 243 aa, 1 stop 
><MW: 26266, pi: 8.43, NX(S/T): 1 

MRPQGPAASPQRLRGLLLLLLLQLPAPSSASEIPKGKQKAQLRQREWDLYNGMCLQGPAGV 
PGRDGSPGANVIPGTPGIPGRDGFKGEKGECLRESFEESWTPNYKQCSWSSLNYGIDLGKIA 
ECTFTKMRSNSALRVLFSGSLRLKCRNACCQRWYFTFNGAECSGPLPIEAIIYLDQGSPEMN 
STINIHRTSSVEGLCSGIGAGLVDVAIWVGTCSDYPKGDASTGWNSVSRI I IEELPK 

Signal peptide: 

amino acids 1-30 

Transmembrane domain: 

amino acids 195-217 
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FIGURE 247 A 

PRO XXXXXXXXXXXXXXX (Length = 15 amino acids) 

Comparison Protein XXXXXYYYYYYY (Length = 12 amino acids) 

% amino acid sequence identity = 

(the number of identically matching amino acid residues between the two polypeptide 
sequences as determined by ALIGN-2) divided by (the total number of amino acid residues of 
the PRO polypeptide) = 

5 divided by 15 = 33.3% 
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FIGURE 247B 

PRO XXXXXXXXXX (Length = 10 amino acids) 

Comparison Protein XXXXXYYYYYYZZYZ (Length = 15 amino acids) 

% amino acid sequence identity = 

(the number of identically matching amino acid residues between the two polypeptide 
sequences as determined by ALIGN-2) divided by (the total number of amino acid residues of 
the PRO polypeptide) = 

5 divided by 10 = 50% 
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FIGURE 247C 



PRO-DNA NNNNNNNNNNNNNN (Length = 14 nucleotides) 

Comparison DNA NNNNNNLLLLLLLLLL (Length = 16 nucleotides) 



% nucleic acid sequence identity = 

(the number of identically matching nucleotides between the two nucleic acid sequences as 
determined by ALIGN-2) divided by (the total number of nucleotides of the PRO-DNA nucleic 
acid sequence) = 

6 divided by 14 = 42.9% 
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FIGURE 247D 



PRO-DNA NNNNNNNNNNNN (Length = 12 nucleotides) 

Comparison DNA NNNNLLLVV (Length = 9 nucleotides) 



% nucleic acid sequence identity = 

(the number of identically matching nucleotides between the two nucleic acid sequences as 
determined by ALIGN-2) divided by (the total number of nucleotides of the PRO-DNA nucleic 
acid sequence) = 

4 divided by 12 = 33.3% 
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FIGURE 248A 



/*
 * Residue substitution scores used for protein alignment, indexed
 * _day[a - 'A'][b - 'A'] for upper-case letters a and b (26 x 26).
 * The table is symmetric: _day[i][j] == _day[j][i].
 *
 * C-C increased from 12 to 15
 * Z is average of EQ
 * B is average of ND
 * match with stop is _M; stop-stop = 0; J (joker) match = 0
 *
 * The row/column for 'O' carries the stop scores (_M everywhere except
 * the O-O entry, which is 0); the J, U and X rows are all zero apart
 * from the stop column.
 */

#define _M	-8	/* value of a match with a stop */

int	_day[26][26] = {
/*	  A  B  C  D  E  F  G  H  I  J  K  L  M  N  O  P  Q  R  S  T  U  V  W  X  Y  Z */
/* A */	{ 2, 0,-2, 0, 0,-4, 1,-1,-1, 0,-1,-2,-1, 0,_M, 1, 0,-2, 1, 1, 0, 0,-6, 0,-3, 0},
/* B */	{ 0, 3,-4, 3, 2,-5, 0, 1,-2, 0, 0,-3,-2, 2,_M,-1, 1, 0, 0, 0, 0,-2,-5, 0,-3, 1},
/* C */	{-2,-4,15,-5,-5,-4,-3,-3,-2, 0,-5,-6,-5,-4,_M,-3,-5,-4, 0,-2, 0,-2,-8, 0, 0,-5},
/* D */	{ 0, 3,-5, 4, 3,-6, 1, 1,-2, 0, 0,-4,-3, 2,_M,-1, 2,-1, 0, 0, 0,-2,-7, 0,-4, 2},
/* E */	{ 0, 2,-5, 3, 4,-5, 0, 1,-2, 0, 0,-3,-2, 1,_M,-1, 2,-1, 0, 0, 0,-2,-7, 0,-4, 3},
/* F */	{-4,-5,-4,-6,-5, 9,-5,-2, 1, 0,-5, 2, 0,-4,_M,-5,-5,-4,-3,-3, 0,-1, 0, 0, 7,-5},
/* G */	{ 1, 0,-3, 1, 0,-5, 5,-2,-3, 0,-2,-4,-3, 0,_M,-1,-1,-3, 1, 0, 0,-1,-7, 0,-5, 0},
/* H */	{-1, 1,-3, 1, 1,-2,-2, 6,-2, 0, 0,-2,-2, 2,_M, 0, 3, 2,-1,-1, 0,-2,-3, 0, 0, 2},
/* I */	{-1,-2,-2,-2,-2, 1,-3,-2, 5, 0,-2, 2, 2,-2,_M,-2,-2,-2,-1, 0, 0, 4,-5, 0,-1,-2},
/* J */	{ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,_M, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
/* K */	{-1, 0,-5, 0, 0,-5,-2, 0,-2, 0, 5,-3, 0, 1,_M,-1, 1, 3, 0, 0, 0,-2,-3, 0,-4, 0},
/* L */	{-2,-3,-6,-4,-3, 2,-4,-2, 2, 0,-3, 6, 4,-3,_M,-3,-2,-3,-3,-1, 0, 2,-2, 0,-1,-2},
/* M */	{-1,-2,-5,-3,-2, 0,-3,-2, 2, 0, 0, 4, 6,-2,_M,-2,-1, 0,-2,-1, 0, 2,-4, 0,-2,-1},
/* N */	{ 0, 2,-4, 2, 1,-4, 0, 2,-2, 0, 1,-3,-2, 2,_M,-1, 1, 0, 1, 0, 0,-2,-4, 0,-2, 1},
/* O */	{_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M, 0,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M},
/* P */	{ 1,-1,-3,-1,-1,-5,-1, 0,-2, 0,-1,-3,-2,-1,_M, 6, 0, 0, 1, 0, 0,-1,-6, 0,-5, 0},
/* Q */	{ 0, 1,-5, 2, 2,-5,-1, 3,-2, 0, 1,-2,-1, 1,_M, 0, 4, 1,-1,-1, 0,-2,-5, 0,-4, 3},
/* R */	{-2, 0,-4,-1,-1,-4,-3, 2,-2, 0, 3,-3, 0, 0,_M, 0, 1, 6, 0,-1, 0,-2, 2, 0,-4, 0},
/* S */	{ 1, 0, 0, 0, 0,-3, 1,-1,-1, 0, 0,-3,-2, 1,_M, 1,-1, 0, 2, 1, 0,-1,-2, 0,-3, 0},
/* T */	{ 1, 0,-2, 0, 0,-3, 0,-1, 0, 0, 0,-1,-1, 0,_M, 0,-1,-1, 1, 3, 0, 0,-5, 0,-3, 0},
/* U */	{ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,_M, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
/* V */	{ 0,-2,-2,-2,-2,-1,-1,-2, 4, 0,-2, 2, 2,-2,_M,-1,-2,-2,-1, 0, 0, 4,-6, 0,-2,-2},
/* W */	{-6,-5,-8,-7,-7, 0,-7,-3,-5, 0,-3,-2,-4,-4,_M,-6,-5, 2,-2,-5, 0,-6,17, 0, 0,-6},
/* X */	{ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,_M, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
/* Y */	{-3,-3, 0,-4,-4, 7,-5, 0,-1, 0,-4,-1,-2,-2,_M,-5,-4,-4,-3,-3, 0,-2, 0, 0,10,-4},
/* Z */	{ 0, 1,-5, 2, 3,-5, 0, 2,-2, 0, 0,-2,-1, 1,_M, 0, 3, 0, 0, 0, 0,-2,-6, 0,-4, 4}
};
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#include <stdio.h> 
#include <ctype.h>

/*
 * Shared limits, scoring constants, structures and globals for the
 * Needleman-Wunsch alignment program (presumably the "nw.h" that the
 * program source includes -- confirm against the original figure).
 */

#define	MAXJMP		16	/* max jumps in a diag */
#define	MAXGAP		24	/* don't continue to penalize gaps larger than this */
#define	JMPS		1024	/* max jmps in an path */
#define	MX		4	/* save if there's at least MX-1 bases since last jmp */

#define	DMAT		3	/* value of matching bases */
#define	DMIS		0	/* penalty for mismatched bases */
#define	DINS0		3	/* penalty for a gap */
				/* NOTE(review): the scan reads "3" for DINS0; 3 and 8 are
				 * easily confused in this scan -- confirm against the
				 * original figure */
#define	DINS1		1	/* penalty per base */
#define	PINS0		8	/* penalty for a gap */
#define	PINS1		4	/* penalty per residue */

struct jmp {
	short		n[MAXJMP];	/* size of jmp (neg for dely) */
	unsigned short	x[MAXJMP];	/* base no. of jmp in seq x */
};					/* limits seq to 2^16 -1 */

struct diag {
	int		score;		/* score at last jmp */
	long		offset;		/* offset of prev block */
	short		ijmp;		/* current jmp index */
	struct jmp	jp;		/* list of jmps */
};

struct path {
	int		spc;		/* number of leading spaces */
	short		n[JMPS];	/* size of jmp (gap) */
	int		x[JMPS];	/* loc of jmp (last elem before gap) */
};

char		*ofile;			/* output file name */
char		*namex[2];		/* seq names: getseqs() */
char		*prog;			/* prog name for err msgs */
char		*seqx[2];		/* seqs: getseqs() */
int		dmax;			/* best diag: nw() */
int		dmax0;			/* final diag */
int		dna;			/* set if dna: main() */
int		endgaps;		/* set if penalizing end gaps */
int		gapx, gapy;		/* total gaps in seqs */
int		len0, len1;		/* seq lens */
int		ngapx, ngapy;		/* total size of gaps */
int		smax;			/* max score: nw() */
int		*xbm;			/* bitmap for matching */
long		offset;			/* current offset in jmp file */
struct	diag	*dx;			/* holds diagonals */
struct	path	pp[2];			/* holds path for seqs */

char		*calloc(), *malloc(), *index(), *strcpy();
char		*getseq(), *g_calloc();
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/* Needleman-Wunsch alignment program
 *
 * usage: progs file1 file2
 *   where file1 and file2 are two dna or two protein sequences.
 *   The sequences can be in upper- or lower-case and may contain ambiguity
 *   Any lines beginning with ';', '>' or '<' are ignored
 *   Max file length is 65535 (limited by unsigned short x in the jmp struct)
 *   A sequence with 1/3 or more of its elements ACGTU is assumed to be DNA
 *   Output is in the file "align.out"
 *
 * The program may create a tmp file in /tmp to hold info about traceback.
 * Original version developed under BSD 4.3 on a vax 8650
 */

#include "nw.h" 
#include "day.h" 

/*
 * DNA match bitmap, indexed by (letter - 'A').  The four bases carry one
 * bit each (A = 1, C = 2, G = 4, T = U = 8); the other non-zero entries
 * are ORs of those bits (e.g. R = 5 = A|G, Y = 10 = C|T, N = 15).
 * Letters with value 0 share no bit with anything.  main() points xbm at
 * this table for DNA input, and nw() treats two letters as matching when
 * their entries have a bit in common.
 */
static int _dbval[26] = {
	1,14,2,13,0,0,4,11,0,0,12,0,3,15,0,0,0,5,6,8,8,7,9,0,10,0
};



/*
 * Protein match bitmap, indexed by (letter - 'A').  Each letter owns the
 * bit 1 << (letter - 'A'), with three exceptions:
 *   B additionally sets the D and N bits,
 *   Z additionally sets the E and Q bits,
 *   J is 0xFFFFFFF (every one of the low 28 bits set).
 * main() points xbm at this table when the input is not DNA.
 */
static int _pbval[26] = {
	1, 2|(1<<('D'-'A'))|(1<<('N'-'A')), 4, 8, 16, 32, 64,
	128, 256, 0xFFFFFFF, 1<<10, 1<<11, 1<<12, 1<<13, 1<<14,
	1<<15, 1<<16, 1<<17, 1<<18, 1<<19, 1<<20, 1<<21, 1<<22,
	1<<23, 1<<24, 1<<25|(1<<('E'-'A'))|(1<<('Q'-'A'))
};



main(ac, av) main 
int ac; 
char *avQ; 

{ 

prog = avrO]; 
if (ac != 3) { 

fprintf(stdcrr. "usage: %s filel file2\n\ prog); 

rprmtf(stderr. "where filel and ftle2 are two dna or two protein sequencesAn"); 
fprimf(stderr,"The sequences can be in upper- or lower-case\n"); 
rprintf(siderr."Any lines beginning with or ' < ' are ignoredW); 
fprintf(stderr," Output is in the file \"align.out\"\n"); 
exit(l); 

} 

namex(01 = av[l]; 

namcxfl] = av|2J; 

seqx|0] = getseq(namexfO), AlenO); 

seqxfl] = getseq(namex[l]. &lenl): 

xbm = (dna)?_dbval : _pbval; 



endgaps = 0; /* 1 to penalize endgaps */ 

ofile =» "align.out"; /* output file */ 

nwO; /* fill in the matrix, get the passible jraps */ 

readjmpsO ; /* get the actual jmps V 

printO: /* print stats, alignment */ 

cleanup(0) : /♦ unlink any tmp files */ 
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/* do the alignment, return best score: main()
 * dna: values in Fitch and Smith, PNAS, 80, 1382-1386, 1983
 * pro: PAM 250 values
 * When scores are equal, we prefer mismatches to any gap, prefer
 * a new gap to extending an ongoing gap, and prefer a gap in seqx
 * to a gap in seq y.
 */

nw() 
{ 



char 


*px. -py: 


/* seqs and ptrs */ 


int 


•ndely, *dely; 


/"keep track of dely */ 


int 


ndelx, delx; 


/♦keep track of delx */ 


int 


*tmp; 


/* for swapping rowO, rowl */ 


int 


mis; 


/* score for each type */ 


int 


insO. insl; 


/* insertion penalties */ 


register 


id; 


/* diagonal index */ 


register 


ij; 


/* jmp index */ 


register 


»col0, *coll; 


. /* score for curr, last row */ 


register 


xx, yy; 


/* index into seqs */ 



dx = (struct diag ")g_ca[loc("to get diags", lenO+lenl + 1, sizcof(struct diag)); 

ndely = (int *)g_calloc("to get ndely", lenl + l, sizeoftfnt)); 
dely = (int •)g_calloc("to get dely", Ienl + 1, sneoftint)); 
coK) = (int *)g_calloc("to get colO", lenl + l, sizeoftfnt)); 
coll = (int *)g_callocfto get coll" , lenl + 1, sizeof(im)); 
insO = (dna)7 DINSO : PINSO; 
insl = (dna)? DINS I : PINS1; 

smax = -10000; 
if(endgaps){ 

for (colOlO] = dely[0I = -insO, yy = 1; yy < = lenl; yy + +) { 
col0[yy] = dely[yy] = coI0[yy-l] - insl; 
ndcly[yy] = yy; 

} 

coI0[01 = 0; /* Waterman Bull Math Biol 84 */ 



for(yy = 1; yy < = lenl; yy + +) 
dely[yyj = -insO; 

/* fill in match matrix 
*/ 

for (px = seqx[0], xx = 1; xx < = lenO; px + +, xx++) { 
/* initialize first entry in col 
*/ 

If (endgaps) { 

if (xx =»=> 1) 

coll[0] = delx = -(insO+insI); 

else 

coll[0] = delx = colO[0] - insl; 
ndelx = xx; 

} 

else { 

coll[0] = 0; 
delx = -insO; 
ndelx = 0; 

) 
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...nw 

for(py = seqxfl), yy = 1; yy < m loil; py+ + , yy++> { 
mis => coI0[yy-l]; 
if (dna) 

mis += (xbm[*px-•A , ]&xbra(*py- , A , ])? DMAT : DMIS; 

else 

mis + = _day{*px- , A'][*py- , A'l; 

/* update penalty for del in x seq; 

* favor new del over ongong del 

* ignore MAXGAP if weighting endgaps 
*/ 

if (endgaps 1 1 ndeiy(yy] < MAXGAP) { 

if (coiO[yy] - insO > - dely(yy]) { 

dclyby] - col0(yy] - (insO + insl); 
ndelyfyy] = 1; 

}else{ 

dely(yyj -= insl; 
ndely{yy]+ + ; 

} 

}else{ 

if (colOfyy] - (insO+insl) > = dely[yyl) { 
dely[yy) - colOtyy] - (insO+insl); 
ndelylyyj = 1; 

}else 

ndely[yy]+ + ; 

> 

/♦ update penalty for del in y seq; 

* favor new del over ongong del 
*/ 

if (endgaps | J ndelx < MAXGAP) { 

if(coll[yy-l]-insO> = delx){ 

delx - colllyy-lj - (insO+insl); 
ndelx - 1; 

}else{ 

delx-= insl; 
ndelx++; 

} 

}else{ 

if (coll[yy-lJ - (insO+insl) > - delx) { 
delx = colllyy-1] - (insO+insl); 
ndelx = 1; 

}ebe 

ndelx++; 

} 

/* pick the maximum score; we're favoring 

* mis over any del and delx over deiy 
V 



J2St /Z 7t> 
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...nw 

id => xx - yy + Icnl - 1; 

if (mis > - deix && mis > = deiy(yyj) 

coll[yy] = mis; 
else if (delx > = dely[yy]) { 

coll[yyj =» delx: 

ij = dx[id].ijmp; 

if (dx[id].jp.n{0) && (!dna 1 1 (ndcix > = MAXJMP 
&& xx > dx[idj.jp.x[ij]+MX) j | mis > dx[id).score+DINSO)) { 
dx(id].ijmp+ + ; 
if( + + ij > = MAXJMP) { 
writejmps(id); 
ij = dxfidj.ijmp = 0; 
dx[idj. offset = offset; 

offset += sizeof(stnictjmp) + sireof(offset); 

} 

} 

dx[id].jp.n{ij] = ndelx; 
dxlidj.jp.xjjj] = xx; 
dx(id). score = defx; 

} 

else { 

coll[yy] = dely[yy]; 
\j => dx(id].ijmp; 

if (dx[id].jp.n(0] && (!dna 1 1 (ndely(yy] > = MAXJMP 

&&xx > dx[id].jp.x[ij]+MX) 1 1 mis > dx[id].score+DINSO)).{ 
dx(id].ijmp++; 
if (++ij > = MAXJMP) { 
whtejmps(id); 
ij = dx[id].ijmp = 0; 
dx(id].offset = offset; 

offset + = sbceof(struct jmp) + sfaeof(offset); 

} 

> 

dx[id].jp.n[ij] - -ndely[yy]; 
dx[id].jp.x[ij] = xx; 
dx[id] .score = dely[yyj; 

} 

if (xx = = lenO && yy < lenl) { 
/* last col 
*/ 

if (endgaps) 

coll[yy] - = insO+insl*(Ienl-yy); 
if (coll[yyJ > smax) { 

smax = coll[yyJ; 

dmax = id; 

} 

} 

> 

if (endgaps && xx < lenO) 

coUfyy-1] -= jnsO+insl*(lcnO-xx); 
if (colI[yy-l] > smax) { 

smax = coll [yy-1]; 

dmax = id; 

} 

tmp = colO; colO = coll; coll = Unp; 

(void) free((cfaar *)ndely); 
(void) free<(cliar *)dely); 
(void) free<(cbar *)co!0); 
(void) free((cliar *)coll); 
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* printO - only routine visible outside this module 
 *
 * static:
 * getmat() - trace back best path, count matches: print()
 * pr_align() - print alignment of described in array p[]: print()
 * dumpblock() - dump a block of lines with numbers, stars: pr_align()
 * nums() - put out a number line: dumpblock()
 * putline() - put out a line (name, [num], seq, [num]): dumpblock()
 * stars() - put a line of stars: dumpblock()
 * stripname() - strip any path and prefix from a seqname
 */

#include "nw.h"



#define SPC     3
#define P_LINE  256     /* maximum output line */
#define P_SPC   3       /* space between name or num and seq */

extern int  _day[26][26];   /* protein score matrix, defined elsewhere */

int     olen;           /* set output line length */
FILE    *fx;            /* output file */

printo print 

Int Ix, ly. firstgap, lastgap; P overlap */ 

if ((fit = fopen(ofile. "w")) == 0) { 

rprinrf(stderr,"%s: can't write %s\a\ prog, ofile); 
cleanupd); 

} 

rprintf(fx, "< first sequence: %s (length = %d)\n", namex(0J. lenO): 
rprinrfXfx, "< second sequence: %s (length = %d)\n", namex[l], lenl); 
olen = 60; 
lx - lenO; 
ly = lenl; 

firstgap = lastgap = 0; 

if (dmax < lenl - 1) { P leading gap in x "/ 
pp[0).spc = firstgap = lenl - dmax - 1; 
ly-= pp[0].spc; 

) 

eke if (dmax > lenl - 1) { /* leading gap in y */ 
pp(l].spc = firstgap = dmax - (lenl - I); 
ix -= pp[l].spc; 

} 

if (dmaxO < lenO - 1) { /* trailing gap in x ■/ 
lastgap = lenO - dmaxO -1 ; 
lx -=» lastgap; 

} 

else if (dmaxO > lenO - 1) { /* trailing gap in y *A 
lastgap = dmaxO - (lenO - 1); 
ly •= lastgap; 

} 

getmat(lx, ly, firstgap, lastgap); 
pralignO: 
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* trace back the best path, count matches 
*/ 

static 

getmat(lx. ly. firstgap, lastgap) 

1*. ly;~ /* "core- (minus endgaps) */ 

^ int firstgap, lastgap; /* leading trailing overlap V 

tat run, i0. il, sizO, sizl; 

char outx[32]; 

double pa; 

register nO.nl; 

register char *p0, *pl; 

/* get total matches, score 
•/ 

iO = il m sizO = sizl = 0; 
pO = seqx[0) + pp(lj.spc; 
pi = seqx[l] + ppfOl.spc; 
nO = pp[l].spc + 1; 
nl = pp[0].spc + 1; 

run = 0; 

whiJe(*pO&&*pl ) { 
if (sizO) { 

pi ++; 
nl + +; 
sizO--; 

} 

else if (sizl) { 

p0+ + ; 



> 

else { 



nO+ + ; 
sizl-; 



if (xbm(*pO-* A'l&xbmt^l-'A]) 

nm+ + ; 
If(n0+ + = - pp{01.x[i0]) 

sizO = pp[OJ.n{iO++l; 
if(nl + + ==pp[l].x[ilj) 

sizl » pp[l].n(il ++]; 

p0++; 
pl + + ; 



} 



/* pet homology: 

* if penalizing endgaps, base is the shorter scq 

* else, knock off overhangs and take shorter core 
*/ 

If (endgaps) 

Ix = (lenO < lenl)?len0: lenl; 

else 

lx = (Ix < ly)? Ix : ly; 
pet = 100.*(double)nm/(doubte)lx; 
fprintf(fx, "\n"); 

fprimf(fx. " < %d match %s in an overlap of %d: %.2f percent similariry\n 
ran, (nm » « 1)? " ; " e $\ Ix, pa); 
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fprintf(fx, " < gaps in first sequence; %d", gapx); .getmat 
it (gap*) { 

(void) sprintf(outx, " (%d %s%s)", 

ngapx. (dna)? "base": 'residue", (ngapx «- 1)? *":V); 

fprmtf<fx,"%s",ourx); 

fprimf(fx, \ gaps in second sequence: %'d", gapy): 
if(gapy){ 

(void) sprintf(outx, " (%d %s%s)", 

ngapy, (dna)? "base": "residue", (ngapy »- I)? ":V); 

fprintt(fx,"%s". outx); 

} 

if (dna) 

fprintf(fx, 

"\n< score: %d (match » %d, mismatch = %d, gap penalty - %d + %d per base)\n\ 
smax. DMAT, DMIS, DINSO, DINS1); 

else 

fprintf(fx, 

"\n< score: %d (Dayhoff PAM 250 matrix, gap penalty - %d + %d per residue)\n", 4 
smax, PDVSO. PINS1); 
if (endgaps) 

fprintf(fx, 

"< endgaps penalized, leftendgap: %d %s%s, right endgap: %d %s%s\n", 
firstgap, (dna)? "base" : "residue", (firstgap =.= 1)? "" : V, 
lastgap, (dna)? "base" : "residue", (lastgap == 1)? : V); 

else 

fprintf(fx, "< endgaps not penalizcd\n"); 



static 


run; 


/* matches in core - for checking */ 


static 


tmax; 


/* lengths of stripped file names */ 


static 


ijPl; 


/*jmp index for a path */ 


static 


nc[21; 


/* number at start of current line */ 


static 


nil2J; 


/* current clem number - for gapping */ 


static 


siz[2); 


static char 




/* ptr to current element */ 


static char 


•poC2]: 


/* ptr to next output char slot ■/ 


static char 


out[2][P_LINE]; 


/* output line */ 


static char 


star[P__UNE]; 


f* set by starsQ */ 



/*
 * print alignment of described in struct path pp[]
 */
static 

prjdignO prjilign 

int nn; /* char count */ 

int more; 
register i; 

for (i ■ 0, hnax - 0; i < 2; i+ +) { 
nn = stripname{namextij); 
if (nn > lmax) 

Imax - nn; 

nc[i] = I; 
ni[il = I; 
siz[il = ij[il - 0: 
ps(i] = seqx(i]; 
po{i] = out(t]; 
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for Cnn = nm - 0. more = 1; more; ) { ...pr align 

for (i = more » 0; i < 2; i+ +) { 
I* 

* do we have more of this sequence? 
*/ 

tf(!*ps[i]) 

continue; 

more+ + ; 

if (PprO spc) { /• leading space */ 
*po[i] + + = 
pp[ij.spc-; 

} 

else if (si2[il) { /* in a gap */ 
*po(i] + + - 

} 

else { /* we're puning a seq element 

*/ 

•pom = *ps[i]; 
if(islower(*ps[i])) 

*ps[i] = wupper(*ps[i]); 

po01++; 
PSW+ + ; 

/* 

* are we ai next gap for this seq? 
*/ 

lf(mra«ppCiU[ij[n]){ 

/* 

* we need to merge all gaps 

* at (his location 
•/ 

siz(il = pp[i].n[ij[i]++]; 
while (ni[i] " pp(iJ.*fij[ilD 

siz(i] ppli].n(ij[i] ++]; 

} 

m[i] + + ; 

} 

} 

if (+ +im * = olen 1 1 !more && nn) { 
dumpblockO: 
ror(i - 0; i < 2; 

poli] - out[i]; 

nn = 0; 

} 

} 

} 

/*
 * dump a block of lines, including numbers, stars: pr_align()
 */
static 

dumpblockO dumpblock 
register i; 

for (i = 0; i < 2; i + +) 
*po[i]- = '\0'; 
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(void) putcf\n'. fx); 
for(i = 0; i < 2; i ++) { 

if (*oui[i] && (*out[i] != * ' 1 1 *(po[\)) != -)) { 
if(i =-0) 

nums(i); 
if (i ~ 0&&*outll]) 
starsO; 

putline(i); 

If (i - - 0 &A *out(lJ) 

rprimf(fx, star): 
if (i « 1) 

nums(i); 



} 
/*
 * put out a number line: dumpblock()
 */

static 
nums(ix) 



FIGURE 248K 

...dumpblock 



{ 



>nt ix; /* index in outQ holding seq line */ 

nlinefPJLJNEJ; 
i.j: 

♦pn, *px, *py; 

ror (pn - niine, i = 0; i < lmax+P_SPC; i++, pn++) 
*pn = ' 

for (i = nc[ix], py = out[ix]; *py; py+ + , pn++) { 
lf(*py=-" M *py~ V) 
*pn — " 'j 



nums 



ebe{ 



} 



} 
} 

*pn = '\0'; 
ncpxj = i; 

for (pn = niine; *pn; pn+ +) 
(void) putc(*pn, fx); 
(void) putc(*\n\ fx); 



if (i%10 ==0 || 0 == l&&nc[ix] != 1)) { 
j - (i < 0)? -i : i; 
for (px = pn; j; j /= 10, px-) 
*px =j%10 + '0'; 

if(i < 0) 

»px = v- 

} 

else 

> = ' ': 



/*
 * put out a line (name, [num], seq, [num]): dumpblock()
 */



pudine<ix) putline 
int ix; 

{ 
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...putline 

int i; 
register char *px; 

for(px - oamexlix], i = 0; *px && *px != px+ + , 

(void) putc(*px ( fx): 
for(; i < lmax+P_SPC; i++) 

(void)putc(' \ fx): 

/* these count from 1 : 

* ni(] is current element (from 1) 

* ncrj is number at start of current line 
•/ 

for(px - outfix]; *px; px++) 

(void) putc(*px&0x7F, fx); 
(void)putcC\n', fx); 

} 



/*
 * put a line of stars (seqs always in out[0], out[1]): dumpblock()
 */

static 

starsO Stars 
{ 

int i; 

register char *pO, *pl. cx, *px; 

If (!*out[0] 1 1 (*out(0J — " && *(po[01) == ' ') 1 1 
!*outfU j | (♦outfll = = ' ' && *(po[l]) -« ' ')) 
return; 
px = star; 

for (i = lmax+P_SPC; i; i~) 
*px++ » ' 

for (pO = outfOJ. pl = out(lJ; *p0 && *pl; pO+ +, pl + +) { 
if (isalpha(*pO) && tsalpba(*pl)) { 

if (xbm(*pO-'A']&xbin[*pl- , A , :|) { 
cx a 
um+ + ; 

} 

elseif(!dna&& _day[*pO- , A'J[*pl- , A , J > 0) 
cx = 

else 

cx - ' '; 

} 

else 

cx « ' '; 
*px+ + = cx; 

} 

•p*++ - 'W; 
•px = *\0'; 

) 
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/* 

 * strip path or prefix from pn, return len: pr_align()
*/ 

/*
 * Remove any leading directory part from pn in place and return the length
 * of what is left.
 *
 * pn - file name (may be a path); modified in place, so it must be writable
 *
 * Everything up to and including the last '/' is dropped.  The tail is
 * shifted left with an explicit forward copy rather than strcpy(), because
 * source and destination overlap and strcpy() is undefined for overlapping
 * objects.
 */
static int
stripname(pn)
    char    *pn;    /* file name (may be path) */
{
    register char   *px, *py;

    py = 0;
    for (px = pn; *px; px++)
        if (*px == '/')
            py = px + 1;
    if (py) {
        /* py > pn, so a forward byte copy is safe for the overlap */
        for (px = pn; (*px = *py) != '\0'; px++, py++)
            ;
    }
    /* px sits on the terminating NUL in both cases */
    return((int)(px - pn));
}
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* deanupO cleanup any tmp file 

 * getseq() - read in seq, set dna, len, maxlen
 * g_calloc() - calloc() with error checkin
 * readjmps() - get the good jmps, from tmp file if necessary
 * writejmps() - write a filled array of jmps to a tmp file: nw()
 */

#include "nw.h"
#include <sys/file.h>



/*
 * mktemp() rewrites the trailing XXXXXX of its template in place, so the
 * template must live in writable storage; a string literal is not.  jname
 * stays a char * for the code that uses it.
 */
static char jname_buf[] = "/tmp/homgXXXXXX";
char    *jname = jname_buf;     /* tmp file for jmps */
FILE    *fj;                    /* stream on the tmp file; 0 until writejmps() opens it */

int     cleanup();              /* cleanup tmp file */
long    lseek();



/* 

* remove any tmp file if we blow 
 */

cleanup(i) 



{ 



int 

if(rj) 

exit(i); 



(void) unlink(jname); 



/* tmp file for jmps */ 
/* cleanup tmp file */ 



cleanup 



/*
 * read, return ptr to seq, set dna, len, maxlen
 * skip lines starting with ';', '<', or '>'
 * seq in upper or lower case
 */

char 

getseq(file, len) 



{ 



♦file; 
♦len: 



register char 
bit . 
FILE 



/* file name */ 
/* seq len */ 

line(1024J, •pseq; 
*px, *py; 
natgc, lien; 



getseq 



If ((fp = fooenCfile.-r-)) == 0) { 

fprintf(stderr."%s: can t read %s\n\ prog, file); 
exit(l); 

) 

tlen = natgc = 0; 

while (fgets<line, 1024, fp)) { 

lf(*line -« ';' || *line ' <> |j *line= = >•) 

continue; 
for(px - line; *px »« 'V;px++) 

if (isupper(*px) 1 1 islower(*px)) 
tlen+ + ; 

} 

if ((pseq = malloc((unsigned)<den+6))) == 0) { 

fprintf(stderr,"%s: mallocO failed to get %d bytes for %s\n", prog, den +6, file); 
exit(l); 

} 

pseq[0] = pseq[l] = pseq[2] « pseq[3J = '\0'; 
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> 



py = pseq + 4; 
*len - lien; 
rcwind(rp); 

while (fge!5(line, 1024, fp)) { 

if(*Unc== || *line || *line == •>') 

continue; 

for(px = line; *px != '\n'; px++) { 
ir (isupper(*px» 

*py++ = *px; 
else If (islower(*px)) 

*py++ = toupper(*px); 
if (imtex(-ATGCU\*(py-l))) 

natgc + + ; 

) } 

*py + + « '\0'; 

•pv = '\0'; 

(void) fclose(rp); 

dna = natgc > (tlen/3); 

return(pseq+4); 



char * 

g_calloc(msg. nx. sz) 



{ 



} 



g_calloc 

„« B , /* program, calling routine */ 

int nx, sz; /* number and size of elements */ 

char *px, *callocO; 

if ((px ■ calloc((unsigned)nx, (unsigned)sz)) = = 0) { 
if(*msg){ 

fprinrf(stderr f '%s: g_calloc0 failed %s (n=%d. sz = %d)ui\ prog. msg. ox, szV 
exit(l); D 

} 

} 

return(px); 



/*
 * get final jmps from dx[] or tmp file, set pp[], reset dmax: main()
 */

P djmps0 readjmps 



int fd - -I; 

int siz, K), il; 

register i.j, xx; 

if(rj){ 

(void) fclose(fj); 

if ((fd = open(jname, O RDONLY, 0)) < 0) { 

fprintf(stderr, "%s: can't opcnO %s\n", prog, jname); 
cleanup(l); 

} 

} 

for (i = t0 - il = o. dmaxO = dmax, xx » lenO; ; i+ +) / 

for (j = dx[dmax].ijmp; j > - 0 && dx[dmaxj.jp.xrj] > = xx; j-) 
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...readjmps 

if 0 < 0 && dx(dmax].offset fj) { 

(void) kcck(fd, dxfdmax]. offset, 0); 

(void) readtfd, (char *)&dx[dmax] jp, sizeof(sinict jmp)); 

(void) readtfd, (char *)&dx(dmax].offset, si2eof(dx[dmax1.offset)); 

dx[dmax].ijmp = MAXJMP-1; 

else 

break; 

} 

if a > = jmps) { 

fprintf(stderr, "%s: too many gaps in alignments", prog); 
cieanup(l); 

) 

ir(j > = 0){ 

siz = dx[dmax].jp.nfj]; 
xx - dxCdraax].jp.x|j]; 
dmax + = siz; 

if (siz < 0){ /* gap in second seq */ 

PP[1I n{«] = -siz; 
xx + = siz; 

/* id = xx - yy + lenl - 1 
*/ 

pp[lj.x[il] = xx - dmax + lenl - 1; 
gapy++; 
□gapy -= siz; 
/* ignore MAX GAP when doing endgaps ♦/ 

siz » (-siz < MAXGAP 1 1 endgaps)? -siz : MAXGAP; 
il + +; 

} 

else if (siz > 0) { /* gap in first seq */ 
po(0J.n[i0] = siz; 
pp{0].x[i0] = xx; 
gapx++; 
ngapx siz; 
/* ignore MAXGAP when doing endgaps */ 

siz = (siz < MAXGAP | j endgaps)? siz : MAXGAP; 
K>++; 

} 

} 

else 

break; 

} 

/* reverse the order of jmps 
•/ 

for (j = 0, K)— ; j < iO; j + + , »-) { 

i - pptP].nrj]; ppfOl.nfj] - pp[0].n[i0]; pp[0].n[K>] = i; 
^ i = pp[0].xfjl; pp[0].xfjj = pp[0].x(iO]; pp[0].x(i0] - i; 

for(j = 0. il-; j < 11; j + + , il-) { 

i = ppM-ntf; ppm.nfj) «□ pp[l].n[il]; pp[l].n(il] = i; 
' = PPm.*UJ; PPlU.xUl = PP[l].xtill; ppll].x(il] = i; 

if <fd >«0) 

(void) close(fd); 

(void) unlink(|name); 
fj -0; 
offset = 0; 

} 



} 
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V* 

* write a filled jmp struct offset of the prev one (if any): nw() 
*/ 

writejmps<ix) witejmps 

tat U; r 
{ - 
char •mlaempO; 

if(!fj){ 

if (mktemp(jname) < 0) { 

fprintf(stderT, "%s: can'i mktempO %s\n", prog, jname); 
deanup(l); 

> 

If ((fj = fopen(jiiame, "w")) == 0) { 

fprintf(stderr, "%s: can't write %s\n\ prog, jname); 
exitfl); 

> 

} 

(void) fwrite((char *)&dx[ix].jp, sizeoflstruct jmp). 1, fj); 
(void) fwrite((char *)&dx[ix].offset, sixeof(dx(«]. offset), 1, fj); 
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